# Data preparation: dump every continuous tree of the PDB-C dataset to
# one-tree-per-line bracket files, one file per dataset split.
import os
import shutil
import sys

from datasets import load_dataset

from IPython.display import display

# neural_parser lives one directory up, so that directory has to be on the
# path before the import below.
sys.path.append('../')
from neural_parser import hybrid_tree_utils

pdbc_dataset = load_dataset('../pdb_c_beta/')

BRACKETS_DIR = 'brackets'
# Start from an empty output directory. A missing directory (first run) is
# fine; any other failure to remove it is a real problem and propagates.
try:
    shutil.rmtree(BRACKETS_DIR)
except FileNotFoundError:
    pass
os.mkdir(BRACKETS_DIR)

# The feature description of the train split is used to decode instances of
# every split.
features = pdbc_dataset['train'].features

for part, dataset in pdbc_dataset.items():
    print(part)
    # Keep only the trees that report themselves as continuous; each one is
    # wrapped in an extra TOP node.
    b_cont = []
    for sentence in dataset:
        tree = hybrid_tree_utils.tree_from_dataset_instance(sentence, features)
        if tree.is_continuous():
            b_cont.append(f'(TOP {tree.to_brackets(morph_tags=True)})')
    filepath = os.path.join(BRACKETS_DIR, f'pdbc-cont-{part}.dat')
    # The trees contain Polish diacritics, so the encoding is pinned instead
    # of being left to the locale default.
    with open(filepath, 'w', encoding='utf-8') as f:
        print(' ', filepath)
        print(' ', len(b_cont))
        for row in b_cont:
            print(row, file=f)
wc {BRACKETS_DIR}/*.dat" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "679b9f10", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(TOP (ROOT (*S (S (NP (AdjP (*Adj (adj:sg:nom:f:pos Skośnooka))) (*NP (*N (subst:sg:nom:f dziewczynka)))) (*VP (*V (fin:sg:ter:imperf trzyma))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:pl:loc:f rękach)))) (NP (AdjP (*Adj (adj:pl:nom:f:pos drewniane))) (*NP (*N (subst:pl:nom:f pałeczki))))) (Punct (interp ,)) (*Conj (conj a)) (S (PrepNP (*Prep (prep:inst:nwok przed)) (NP (*N (ppron3:sg:inst:f:ter:akc:praep nią)))) (*VP (*V (fin:pl:ter:imperf znajdują))) (Part (part się)) (NP (*NP (*N (subst:pl:nom:n:ncol naczynia))) (AdjP (*Adj (adj:pl:nom:n:pos kuchenne)))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:n:col Dziecko))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (AdjP (*Adj (adj:sg:loc:f:pos różowej))) (*NP (*N (subst:sg:loc:f opasce)))))) (*VP (*V (fin:sg:ter:imperf unosi))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:pl:loc:f rękach)))) (NP (AdjP (*Adj (adj:pl:acc:m3:pos drewniane))) (*NP (*N (subst:pl:acc:m3 patyczki)))) (PrepNP (*Prep (prep:inst:nwok nad)) (NP (AdjP (*AdjP (*Adj (ppas:pl:inst:n:perf:aff postawionymi))) (NP (PrepNP (*Prep (prep:gen do)) (NP (*N (subst:sg:gen:f góry)))) (*NP (*N (subst:sg:inst:n:ncol dnem))))) (*NP (NP (*N (subst:sg:inst:f miską))) (*Conj (conj i)) (NP (*N (subst:sg:inst:m3 garnkiem))))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:pl:nom:m1 Zawodnicy))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:n:ncol pobliżu))) (NP (*N (subst:sg:gen:f piłki)))))) (*VP (*V (fin:pl:ter:imperf przepychają))) (Part (part się)) (PrepNP (*Prep (prep:inst między)) (NP (*N (siebie:inst sobą)))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:n:ncol boisku))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (S (NP (*NP (*N (subst:sg:nom:f Dziewczynka))) (PrepNP (*Prep 
(prep:loc:nwok w)) (NP (*N (subst:sg:loc:f sukience))))) (*VP (*V (fin:sg:ter:imperf puszcza))) (NP (*NP (*N (subst:pl:acc:f bańki))) (AdjP (*Adj (adj:pl:acc:f:pos mydlane)))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f trawie))))) (Punct (interp ,)) (*Conj (conj a)) (S (PrepNP (*Prep (prep:inst za)) (NP (*N (ppron3:sg:inst:f:ter:akc:praep nią)))) (*VP (*V (fin:sg:ter:imperf stoi))) (NP (AdjP (*Adj (adj:sg:nom:f:pos druga))) (*NP (*N (subst:sg:nom:f dziewczynka)))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:pl:nom:f Dziewczynki))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (AdjP (*Adj (adj:pl:loc:f:pos kolorowych))) (*NP (*N (subst:pl:loc:f sukienkach)))))) (*VP (*V (fin:pl:ter:imperf stoją))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f trawie)))) (VP (Punct (interp ,)) (*VP (*V (pcon:imperf puszczając))) (NP (*NP (*N (subst:pl:acc:f bańki))) (AdjP (*Adj (adj:pl:acc:f:pos mydlane)))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Grupa))) (NP (*N (subst:pl:gen:n:col dzieci)))) (*VP (*V (fin:sg:ter:imperf moczy))) (Part (part się)) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:f wodzie))) (PrepNP (*Prep (prep:gen:nwok z)) (NP (*N (subst:sg:gen:f fontanny))))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NumP (*Num (num:pl:nom:m1:rec:ncol Kilku))) (NP (*N (subst:pl:gen:m1 chłopców)))) (*VP (*V (fin:sg:ter:imperf kąpie))) (Part (part się)) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:f fontannie))) (PrepNP (*Prep (prep:gen obok)) (NP (*NP (*N (subst:pl:gen:m3 stolików))) (CP (Punct (interp ,)) (*S (PrepAdjP (*Prep (prep:loc przy)) (AdjP (*Adj (adj:pl:loc:m3:pos których)))) (*VP (*V (fin:pl:ter:imperf siedzą))) (NP (*N (subst:pl:nom:m1 ludzie)))))))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Dwójka))) (NP (AdjP (*Adj (adj:pl:gen:n:pos nagich))) (*NP (*N (subst:pl:gen:n:col dzieci))) (AdjP (*AdjP (*Adj (ppas:pl:gen:n:perf:aff 
ubrudzonych))) (NP (*N (subst:pl:inst:f farbkami)))))) (*VP (*V (fin:sg:ter:imperf siedzi))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f podłodze)))) (PrepNP (*Prep (prep:gen obok)) (NP (AdjP (*Adj (adj:pl:gen:f:pos porozrzucanych))) (*NP (*N (subst:pl:gen:f kartek)))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (S (NP (*NumP (*Num (num:pl:nom:n:rec:col Dwoje))) (NP (AdjP (AdjP (*Adj (adj:pl:gen:n:pos nagich))) (*Conj (interp ,)) (AdjP (*Adj (adj:pl:gen:n:pos małych)))) (*NP (*N (subst:pl:gen:n:col dzieci))))) (*VP (*V (fin:sg:ter:imperf siedzi))) (PrepNP (*Prep (prep:gen naprzeciwko)) (NP (*N (siebie:gen siebie))))) (*Conj (conj i)) (S (NP (AdjP (*Adj (adj:sg:nom:n:com większe))) (*NP (*N (subst:sg:nom:n:col dziecko)))) (*VP (*V (fin:sg:ter:imperf smaruje))) (NP (*N (subst:sg:inst:f farbą))) (NP (AdjP (*Adj (adj:sg:acc:n:com mniejsze))) (*NP (*N (subst:sg:acc:n:col dziecko)))))) (Punct (interp .))))\r\n", + "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Dziewczynka))) (PrepNP (*Prep (prep:loc o)) (NP (AdjP (*Adj (adj:pl:loc:n:pos ciemnych))) (*NP (*N (subst:pl:loc:n:col oczach)))))) (*VP (*V (fin:sg:ter:imperf patrzy))) (PrepNP (*Prep (prep:acc na)) (NP (AdjP (*Adj (adj:sg:acc:m3:pos czarny))) (*NP (*N (subst:sg:acc:m3 przedmiot))) (CP (Punct (interp ,)) (*S (AdjP (*Adj (adj:sg:acc:m3:pos który))) (*VP (*V (fin:sg:ter:imperf trzyma))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:sg:loc:f ręce))))))))) (Punct (interp .))))\r\n" + ] + } + ], + "source": [ + "! 
head {BRACKETS_DIR}/pdbc-cont-train.dat" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "TF_zajecia", + "language": "python", + "name": "tf_zajecia" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.6" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/BeNePar/TrainAndParse.ipynb a/BeNePar/TrainAndParse.ipynb new file mode 100644 index 0000000..34a3065 --- /dev/null +++ a/BeNePar/TrainAndParse.ipynb @@ -0,0 +1,973 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 5, + "id": "d8404675", + "metadata": {}, + "outputs": [], + "source": [ + "#BENEPAR = '/home/kkrasnowska/benepar_experiments/self-attentive-parser/src/main.py'" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "88603098", + "metadata": {}, + "outputs": [], + "source": [ + "#! mkdir models" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "d5aedb53", + "metadata": {}, + "outputs": [], + "source": [ + "#! 
python {BENEPAR} train \\\n", + "# --train-path brackets/pdbc-cont-train.dat \\\n", + "# --dev-path brackets/pdbc-cont-validation.dat \\\n", + "# --evalb-dir /home/kkrasnowska/benepar_experiments/self-attentive-parser/EVALB_SPMRL \\\n", + "# --use-pretrained --pretrained-model \"allegro/herbert-large-cased\" \\\n", + "# --use-encoder --num-layers 2 \\\n", + "# --predict-tags \\\n", + "# --model-path-base models" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "3f6aaf27", + "metadata": {}, + "outputs": [], + "source": [ + "from IPython.display import display, HTML" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "8d9d5103", + "metadata": {}, + "outputs": [], + "source": [ + "import benepar\n", + "import nltk\n", + "import spacy" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "c56eda57", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertModel: ['cls.predictions.transform.LayerNorm.bias', 'cls.sso.sso_relationship.weight', 'cls.predictions.transform.dense.weight', 'cls.sso.sso_relationship.bias', 'cls.predictions.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.decoder.bias']\n", + "- This IS expected if you are initializing BertModel from the checkpoint of a model trained on another task or with another architecture (e.g. 
MODEL = 'models_dev=97.36.pt'

# Notebook kernels (and scripts) run with __name__ == '__main__', so the
# checkpoint is still loaded when this cell executes; the guard only keeps the
# load from happening if the helpers below are imported from elsewhere.
if __name__ == '__main__':
    parser = benepar.Parser(MODEL)


def postprocess(tree):
    """Undo bracket escaping in a parsed tree, in place.

    In every node label ``LPAR`` / ``RPAR`` become ``(`` / ``)``; in every
    string child ``-LSB-`` / ``-RSB-`` become ``[`` / ``]``.

    Args:
        tree: a tree object exposing ``subtrees()``, ``label()``,
            ``set_label()`` and list-style item assignment (the callers in
            this notebook pass ``nltk.Tree`` instances).

    Returns:
        The same ``tree`` object, modified.
    """
    for node in tree.subtrees():
        node.set_label(node.label().replace('LPAR', '(').replace('RPAR', ')'))
        # Assigning to node[i] replaces an element without changing the
        # length, so it is safe while enumerating the node.
        for i, child in enumerate(node):
            if isinstance(child, str):
                node[i] = child.replace('-LSB-', '[').replace('-RSB-', ']')
    return tree


def parse_tokenized_sentences(sentences, parser):
    """Parse pre-tokenized sentences and post-process every resulting tree.

    Args:
        sentences: iterable of token lists, one list per sentence.
        parser: object with a ``parse_sents`` method accepting
            ``benepar.InputSentence`` items (e.g. ``benepar.Parser``).

    Returns:
        A list with one post-processed tree per input sentence.
    """
    # Build the parser inputs exactly once.
    inputs = [benepar.InputSentence(words=tokens) for tokens in sentences]
    return [postprocess(tree) for tree in parser.parse_sents(inputs)]


def parse_sentence(sentence, parser):
    """Parse one sentence given as a whitespace-separated token string.

    Args:
        sentence: string whose tokens are separated by whitespace.
        parser: passed through to ``parse_tokenized_sentences``.

    Returns:
        The post-processed tree for the sentence.
    """
    return parse_tokenized_sentences([sentence.split()], parser)[0]
Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.\n", + "/home/kkrasnowska/venvs/torch_benepar/lib/python3.10/site-packages/torch/distributions/distribution.py:44: UserWarning: <class 'torch_struct.distributions.TreeCRF'> does not define `arg_constraints`. Please set `arg_constraints = {}` or initialize the distribution with `validate_args=False` to turn off validation.\n", + " warnings.warn(f'{self.__class__} does not define `arg_constraints`. ' +\n" + ] + }, + { + "data": { + "image/svg+xml": [ + "<svg baseProfile=\"full\" height=\"312px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,512.0,312.0\" width=\"512px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">TOP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"12.5%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">[</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"6.25%\" y1=\"1.2em\" y2=\"3em\" /><svg 
width=\"75%\" x=\"12.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"35.4167%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:nom:m2</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Koty</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"17.7083%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"12.5%\" x=\"35.4167%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">pred</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">to</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"41.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"35.4167%\" x=\"47.9167%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:nom:m1</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">złodzieje</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"65.625%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.6667%\" x=\"83.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"91.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"12.5%\" x=\"87.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">]</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"93.75%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg>" + ], + "text/plain": [ + "Tree('TOP', [Tree('ROOT', [Tree('Punct', [Tree('interp', ['['])]), Tree('*S', [Tree('NP', [Tree('*N', [Tree('subst:pl:nom:m2', ['Koty'])])]), Tree('*VP', [Tree('*V', [Tree('pred', ['to'])])]), Tree('NP', [Tree('*N', [Tree('subst:pl:nom:m1', ['złodzieje'])])]), Tree('Punct', [Tree('interp', ['.'])])]), Tree('Punct', [Tree('interp', [']'])])])])" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "parse_sentence('[ Koty to złodzieje . 
]', parser)" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "d62d1e31", + "metadata": {}, + "outputs": [ + { + "data": { + "image/svg+xml": [ + "<svg baseProfile=\"full\" height=\"312px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,560.0,312.0\" width=\"560px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">TOP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"88.5714%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"72.5806%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"44.4444%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Widział</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.2222%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.5556%\" x=\"44.4444%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">aglt:sg:pri:imperf:nwok</text></svg><svg width=\"100%\" 
x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">am</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.2222%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"36.2903%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"27.4194%\" x=\"72.5806%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:m2</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">kotka</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"86.2903%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"44.2857%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"11.4286%\" x=\"88.5714%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
# Quick demo parse; display() keeps the tree rendered even though the call is
# no longer the last expression of its own cell.
display(parse_sentence('Widział am kotka .', parser))


def _load_gold_trees(path):
    """Read one bracketed tree per line from ``path`` and post-process each."""
    # The bracket files hold Polish text; decode them as UTF-8 explicitly
    # rather than relying on the locale default.
    with open(path, encoding='utf-8') as f:
        return [postprocess(nltk.Tree.fromstring(line.strip('\n'))) for line in f]


val_trees = _load_gold_trees('brackets/pdbc-cont-validation.dat')
test_trees = _load_gold_trees('brackets/pdbc-cont-test.dat')

# Token sequences of the gold trees are the parser input.
val_sentences = [tree.leaves() for tree in val_trees]
test_sentences = [tree.leaves() for tree in test_trees]

val_pred_trees = parse_tokenized_sentences(val_sentences, parser)
test_pred_trees = parse_tokenized_sentences(test_sentences, parser)

# Sanity check: exactly one predicted tree per gold tree.
assert len(val_trees) == len(val_pred_trees), 'validation: gold/predicted count mismatch'
assert len(test_trees) == len(test_pred_trees), 'test: gold/predicted count mismatch'

# drop the TOP
val_trees = [t[0] for t in val_trees]
test_trees = [t[0] for t in test_trees]
val_pred_trees = [t[0] for t in val_pred_trees]
test_pred_trees = [t[0] for t in test_pred_trees]
y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">W</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:loc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">samolocie</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"11.1888%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"13.986%\" x=\"22.3776%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" 
x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">czytał</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"29.3706%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"63.6364%\" x=\"36.3636%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"18.6813%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:acc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">wycinki</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"9.34066%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"81.3187%\" 
x=\"18.6813%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"20.2703%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">z</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"10.1351%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"79.7297%\" x=\"20.2703%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"27.1186%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prasy</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"13.5593%\" y1=\"1.2em\" y2=\"3em\" 
/><svg width=\"72.8814%\" x=\"27.1186%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"41.8605%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polskiej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.9302%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.2791%\" x=\"41.8605%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">i</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"41.8605%\" x=\"58.1395%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polonijnej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"79.0698%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"63.5593%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"60.1351%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"59.3407%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"68.1818%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.8455%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.33236%\" x=\"41.691%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">-</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"42.8571%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.9767%\" 
x=\"44.0233%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"17.7083%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepAdjP</text></svg><svg width=\"44.1176%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.0588%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.8824%\" x=\"44.1176%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:loc:m3:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">każdym</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0588%\" y1=\"1.2em\" 
y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"8.85417%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"6.77083%\" x=\"17.7083%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">imps:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">piętnowano</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.0938%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"17.7083%\" x=\"24.4792%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppron3:sg:acc:m1:ter:nakc:npraep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">go</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" 
x1=\"50%\" x2=\"33.3333%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"57.8125%\" x=\"42.1875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Compar</text></svg><svg width=\"6.30631%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">jako</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.15315%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"93.6937%\" x=\"6.30631%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"7.69231%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.84615%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"7.69231%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">bez</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">umiaru</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.0769%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"24.0385%\" x=\"38.4615%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*AdjP</text></svg><svg width=\"100%\" 
x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppas:sg:acc:m1:perf:aff</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">zapatrzonego</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50.4808%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"29.8077%\" x=\"62.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"48.3871%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:acc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"24.1935%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"51.6129%\" x=\"48.3871%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Moskwę</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"74.1935%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"77.4038%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"7.69231%\" x=\"92.3077%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"96.1538%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"53.1532%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.0938%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0117%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"48.8604%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.2792%\" x=\"97.7208%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"98.8604%\" y1=\"1.2em\" y2=\"3em\" /></svg>" + ], + "text/plain": [ + "Tree('ROOT', [Tree('*S', [Tree('S', [Tree('PrepNP', [Tree('*Prep', [Tree('prep:loc:nwok', ['W'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:loc:m3', ['samolocie'])])])]), Tree('*VP', [Tree('*V', [Tree('praet:sg:m1:imperf', ['czytał'])])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:pl:acc:m3', ['wycinki'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['z'])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:sg:gen:f', ['prasy'])])]), Tree('AdjP', [Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polskiej'])])]), Tree('*Conj', [Tree('conj', ['i'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polonijnej'])])])])])])])]), Tree('*Conj', [Tree('interp', ['-'])]), Tree('S', [Tree('PrepAdjP', [Tree('*Prep', [Tree('prep:loc:nwok', ['w'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:loc:m3:pos', ['każdym'])])])]), Tree('*VP', [Tree('*V', [Tree('imps:imperf', ['piętnowano'])])]), Tree('NP', [Tree('*N', [Tree('ppron3:sg:acc:m1:ter:nakc:npraep', ['go'])])]), Tree('Compar', [Tree('*Comp', [Tree('comp', ['jako'])]), Tree('AdjP', [Tree('Punct', [Tree('interp', ['\"'])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['bez'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:gen:m3', ['umiaru'])])])]), Tree('*AdjP', [Tree('*Adj', [Tree('ppas:sg:acc:m1:perf:aff', ['zapatrzonego'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:acc:nwok', ['w'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:acc:f', 
['Moskwę'])])])]), Tree('Punct', [Tree('interp', ['\"'])])])])])]), Tree('Punct', [Tree('interp', ['.'])])])" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "val_trees[504]" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "1059e782", + "metadata": {}, + "outputs": [ + { + "data": { + "image/svg+xml": [ + "<svg baseProfile=\"full\" height=\"504px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,2808.0,504.0\" width=\"2808px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"97.7208%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"41.691%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"22.3776%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">W</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" 
y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:loc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">samolocie</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"11.1888%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"13.986%\" x=\"22.3776%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">czytał</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" 
x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"29.3706%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"63.6364%\" x=\"36.3636%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"18.6813%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:acc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">wycinki</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"9.34066%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"81.3187%\" x=\"18.6813%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"20.2703%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">z</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"10.1351%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"79.7297%\" x=\"20.2703%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"27.1186%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prasy</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"13.5593%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"72.8814%\" x=\"27.1186%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"41.8605%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg 
width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polskiej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.9302%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.2791%\" x=\"41.8605%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">i</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"41.8605%\" x=\"58.1395%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polonijnej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" 
x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"79.0698%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"63.5593%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"60.1351%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"59.3407%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"68.1818%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.8455%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.33236%\" x=\"41.691%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">-</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"42.8571%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.9767%\" x=\"44.0233%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"17.7083%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepAdjP</text></svg><svg width=\"44.1176%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" 
y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.0588%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.8824%\" x=\"44.1176%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:loc:m3:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">każdym</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0588%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"8.85417%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"6.77083%\" x=\"17.7083%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">imps:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">piętnowano</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.0938%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"17.7083%\" x=\"24.4792%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppron3:sg:acc:m1:ter:nakc:npraep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">go</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"33.3333%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"57.8125%\" x=\"42.1875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Compar</text></svg><svg width=\"6.30631%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">jako</text></svg></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.15315%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"93.6937%\" x=\"6.30631%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"7.69231%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.84615%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"7.69231%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">bez</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" 
y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">umiaru</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.0769%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"24.0385%\" x=\"38.4615%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppas:sg:acc:m1:perf:aff</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">zapatrzonego</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" 
x1=\"50%\" x2=\"50.4808%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"29.8077%\" x=\"62.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"48.3871%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:acc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"24.1935%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"51.6129%\" x=\"48.3871%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Moskwę</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"74.1935%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"77.4038%\" y1=\"1.2em\" y2=\"3em\" /><svg 
width=\"7.69231%\" x=\"92.3077%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"96.1538%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"53.1532%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.0938%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0117%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"48.8604%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.2792%\" x=\"97.7208%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"98.8604%\" y1=\"1.2em\" y2=\"3em\" /></svg>" + ], + "text/plain": [ + "Tree('ROOT', [Tree('*S', [Tree('S', [Tree('PrepNP', [Tree('*Prep', [Tree('prep:loc:nwok', ['W'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:loc:m3', ['samolocie'])])])]), Tree('*VP', [Tree('*V', 
[Tree('praet:sg:m1:imperf', ['czytał'])])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:pl:acc:m3', ['wycinki'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['z'])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:sg:gen:f', ['prasy'])])]), Tree('AdjP', [Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polskiej'])])]), Tree('*Conj', [Tree('conj', ['i'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polonijnej'])])])])])])])]), Tree('*Conj', [Tree('interp', ['-'])]), Tree('S', [Tree('PrepAdjP', [Tree('*Prep', [Tree('prep:loc:nwok', ['w'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:loc:m3:pos', ['każdym'])])])]), Tree('*VP', [Tree('*V', [Tree('imps:imperf', ['piętnowano'])])]), Tree('NP', [Tree('*N', [Tree('ppron3:sg:acc:m1:ter:nakc:npraep', ['go'])])]), Tree('Compar', [Tree('*Comp', [Tree('comp', ['jako'])]), Tree('AdjP', [Tree('Punct', [Tree('interp', ['\"'])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['bez'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:gen:m3', ['umiaru'])])])]), Tree('*AdjP', [Tree('*Adj', [Tree('ppas:sg:acc:m1:perf:aff', ['zapatrzonego'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:acc:nwok', ['w'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:acc:f', ['Moskwę'])])])]), Tree('Punct', [Tree('interp', ['\"'])])])])])]), Tree('Punct', [Tree('interp', ['.'])])])" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "val_pred_trees[504]" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "id": "4d6c7096", + "metadata": {}, + "outputs": [], + "source": [ + "'''\n", + "def undummy(_tree):\n", + " tree = _tree.copy(deep=True)\n", + " for node in tree.subtrees():\n", + " for i, child in enumerate(node):\n", + " if type(child) != str and child.label() == 'DUMMY_PRE':\n", + " node[i] = child[0]\n", + " return tree\n", + "\n", + "'''\n", + "def untag(_tree):\n", + " tree = _tree.copy(deep=True)\n", + " for node in tree.subtrees():\n", + 
" for i, child in enumerate(node):\n", + " if type(child) != str and set(map(type, child)) == {str}:\n", + " assert(len(child) == 1)\n", + " node[i] = child[0]\n", + " #if set(map(type, node)) == {str}:\n", + " # assert(len(node) == 1)\n", + " # node.set_label('xxx')\n", + " return tree\n", + "\n", + "'''\n", + "\n", + "ZDANIE_HEADS = {'*ff', '*spójnik', '*przec', '*zdanie', '*formawykrz'}\n", + "ZDANIE_HEADS2 = set(l.strip('*') for l in ZDANIE_HEADS)\n", + "ZDANIE_HEAD_HIERARCHY = ('ff', 'spójnik', 'przec', 'zdanie')\n", + "\n", + "\n", + "def correct(_tree):\n", + " tree = _tree.copy(deep=True)\n", + " for node in tree.subtrees():\n", + " if len(node) == 1 and type(node[0]) != str and node.label() == node[0].label():\n", + " new_children = [child for child in node[0]]\n", + " node.pop()\n", + " node += new_children\n", + " for node in tree.subtrees():\n", + " if 'zdanie' in node.label():\n", + " heads = []\n", + " non_heads = []\n", + " for child in node:\n", + " if child.label().startswith('*') and child.label() not in ZDANIE_HEADS:\n", + " child.set_label(child.label()[1:])\n", + " (heads if child.label().startswith('*') else non_heads).append(child)\n", + " \n", + " return tree\n", + "''';" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "id": "4a26b2e1", + "metadata": { + "scrolled": false + }, + "outputs": [], + "source": [ + "from collections import Counter, defaultdict\n", + "\n", + "c = Counter()\n", + "\n", + "def tree2spans(_tree):\n", + " # make tokens unique\n", + " tree = _tree.copy(deep=True)\n", + " idx = 0\n", + " for node in tree.subtrees():\n", + " for i, child in enumerate(node):\n", + " if type(child) == str:\n", + " node[i] = f'{idx}##{child}'\n", + " idx += 1\n", + " spans = []\n", + " for node in tree.subtrees():\n", + " spans.append((\n", + " node.label(),\n", + " tuple(child if type(child) == str else child.label() for child in node),\n", + " ' '.join(node.leaves())\n", + " ))\n", + " assert (len(set(spans)) == 
len(spans))\n", + " return set(spans)\n", + "\n", + "def spans2dict(spans):\n", + " s = defaultdict(set)\n", + " for node, children, text in spans:\n", + " if node in s[text]:\n", + " print('!!!!!!!!!!!!!!!', node, text)\n", + " display(spans)\n", + " s[text].add(node)\n", + " return s\n", + "\n", + "def spans2errors(spans_gold, spans_pred):\n", + " sg = spans2dict(spans_gold)\n", + " sp = spans2dict(spans_pred)\n", + " errors = []\n", + " tp, fp, fn = 0, 0, 0\n", + " for text in set(sg.keys()).union(sp.keys()):\n", + " txt = ' '.join('X' for _ in text.split())\n", + " errs = []\n", + " for span in sg[text].union(sp[text]):\n", + " if span in sg[text] and span not in sp[text]:\n", + " errs.append(f'-{span}')\n", + " fn += 1\n", + " elif span not in sg[text] and span in sp[text]:\n", + " errs.append(f'+{span}')\n", + " fp += 1\n", + " else:\n", + " tp += 1\n", + " if errs:\n", + " errors.append((tuple(sorted(errs)), text))\n", + " #display(errors)\n", + " #print('tp:', tp, 'fp:', fp, 'fn:', fn)\n", + " #p, r = tp / (tp + fp), tp / (tp + fn)\n", + " #f1 = 2 * tp / (2 * tp + fp + fn)\n", + " #print('precision: ', p)\n", + " #print('recall: ', r)\n", + " #print('f1: ', f1)\n", + " return (tp, fp, fn), errors" + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "id": "397e3750", + "metadata": {}, + "outputs": [], + "source": [ + "def eval_trees(trees_gold, trees_pred):\n", + " evaluation, errors = [], []\n", + " for _tree_gold, _tree_pred in list(zip(trees_gold, trees_pred)):\n", + " try:\n", + " assert(''.join(_tree_gold.leaves()) == ''.join(_tree_pred.leaves()))\n", + " except:\n", + " print(_tree_gold.leaves())\n", + " print(_tree_pred.leaves())\n", + " raise\n", + " tree_gold = untag(_tree_gold)\n", + " tree_pred = untag(_tree_pred)\n", + " spans_gold = tree2spans(tree_gold)\n", + " spans_pred = tree2spans(tree_pred)\n", + " if tree_gold.leaves() == ['Poszedł', 'em', 'do', 'adwokata', '.']:\n", + " display(tree_gold)\n", + " display(tree_pred)\n", + " 
print(spans_gold)\n", + " print(spans_pred)\n", + " try:\n", + " evl, errs = spans2errors(spans_gold, spans_pred)\n", + " evaluation.append(evl)\n", + " errors += [(err, _tree_gold, _tree_pred) for err in errs]\n", + " except:\n", + " display(tree_pred)\n", + " display2(_tree_pred)\n", + " print(i)\n", + " raise\n", + " return evaluation, errors" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "5dcd68fd", + "metadata": {}, + "outputs": [ + { + "data": { + "image/svg+xml": [ + "<svg baseProfile=\"full\" height=\"264px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,296.0,264.0\" width=\"296px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"81.0811%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"43.3333%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"69.2308%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Poszedł</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"34.6154%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"69.2308%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">em</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"84.6154%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" 
x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"56.6667%\" x=\"43.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"41.1765%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">do</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.5882%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"58.8235%\" x=\"41.1765%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adwokata</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"70.5882%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"40.5405%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"18.9189%\" x=\"81.0811%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"90.5405%\" y1=\"1.2em\" y2=\"3em\" /></svg>" + ], + "text/plain": [ + "Tree('ROOT', [Tree('*S', [Tree('*VP', [Tree('*V', ['Poszedł', 'em'])]), Tree('PrepNP', [Tree('*Prep', ['do']), Tree('NP', [Tree('*N', ['adwokata'])])])]), Tree('Punct', ['.'])])" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/svg+xml": [ + "<svg baseProfile=\"full\" height=\"264px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,296.0,264.0\" width=\"296px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"81.0811%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"43.3333%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"69.2308%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Poszedł</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"34.6154%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"69.2308%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">em</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"84.6154%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" 
x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"56.6667%\" x=\"43.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"41.1765%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">do</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.5882%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"58.8235%\" x=\"41.1765%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adwokata</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"70.5882%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"40.5405%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"18.9189%\" x=\"81.0811%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"90.5405%\" y1=\"1.2em\" y2=\"3em\" /></svg>" + ], + "text/plain": [ + "Tree('ROOT', [Tree('*S', [Tree('*VP', [Tree('*V', ['Poszedł', 'em'])]), Tree('PrepNP', [Tree('*Prep', ['do']), Tree('NP', [Tree('*N', ['adwokata'])])])]), Tree('Punct', ['.'])])" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{('Punct', ('4##.',), '4##.'), ('*Prep', ('2##do',), '2##do'), ('ROOT', ('*S', 'Punct'), '0##Poszedł 1##em 2##do 3##adwokata 4##.'), ('NP', ('*N',), '3##adwokata'), ('*V', ('0##Poszedł', '1##em'), '0##Poszedł 1##em'), ('PrepNP', ('*Prep', 'NP'), '2##do 3##adwokata'), ('*S', ('*VP', 'PrepNP'), '0##Poszedł 1##em 2##do 3##adwokata'), ('*N', ('3##adwokata',), '3##adwokata'), ('*VP', ('*V',), '0##Poszedł 1##em')}\n", + "{('Punct', ('4##.',), '4##.'), ('*Prep', ('2##do',), '2##do'), ('ROOT', ('*S', 'Punct'), '0##Poszedł 1##em 2##do 3##adwokata 4##.'), ('NP', ('*N',), '3##adwokata'), ('*V', ('0##Poszedł', '1##em'), '0##Poszedł 1##em'), ('PrepNP', ('*Prep', 'NP'), '2##do 3##adwokata'), ('*S', ('*VP', 'PrepNP'), '0##Poszedł 1##em 2##do 3##adwokata'), ('*N', ('3##adwokata',), '3##adwokata'), ('*VP', ('*V',), '0##Poszedł 1##em')}\n", + "!!!!!!!!!!!!!!! *AdvP 0##Trudno\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adv', ('0##Trudno',), '0##Trudno'),\n", + " ('*AdvP', ('*Adv',), '0##Trudno'),\n", + " ('*AdvP', ('*AdvP',), '0##Trudno'),\n", + " ('Punct', ('1##.',), '1##.'),\n", + " ('ROOT', ('*AdvP', 'Punct'), '0##Trudno 1##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! 
*AdvP 0##Trudno\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adv', ('0##Trudno',), '0##Trudno'),\n", + " ('*AdvP', ('*Adv',), '0##Trudno'),\n", + " ('*AdvP', ('*AdvP',), '0##Trudno'),\n", + " ('Punct', ('1##.',), '1##.'),\n", + " ('ROOT', ('*AdvP', 'Punct'), '0##Trudno 1##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! *PrepNP 0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Comp', ('3##iż',), '3##iż'),\n", + " ('*Comp', ('7##iż',), '7##iż'),\n", + " ('*Conj', ('6##,',), '6##,'),\n", + " ('*N', ('1##tym',), '1##tym'),\n", + " ('*N', ('11##nic',), '11##nic'),\n", + " ('*N', ('5##nikim',), '5##nikim'),\n", + " ('*N', ('9##cię',), '9##cię'),\n", + " ('*NP', ('*N',), '1##tym'),\n", + " ('*Prep', ('0##O',), '0##O'),\n", + " ('*Prep', ('10##za',), '10##za'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('*V', ('4##jesteś',), '4##jesteś'),\n", + " ('*V', ('8##mają',), '8##mają'),\n", + " ('*VP', ('*V',), '4##jesteś'),\n", + " ('*VP', ('*V',), '8##mają'),\n", + " ('CP', ('*Comp', 'S'), '7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('CP',\n", + " ('CP', '*Conj', 'CP'),\n", + " '2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('CP', ('Punct', '*Comp', 'S'), '2##, 3##iż 4##jesteś 5##nikim'),\n", + " ('NP', ('*N',), '11##nic'),\n", + " ('NP', ('*N',), '5##nikim'),\n", + " ('NP', ('*N',), '9##cię'),\n", + " ('NP',\n", + " ('*NP', 'CP'),\n", + " '1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('PrepNP', ('*Prep', 'NP'), '10##za 11##nic'),\n", + " ('Punct', ('12##!',), 
'12##!'),\n", + " ('Punct', ('2##,',), '2##,'),\n", + " ('ROOT',\n", + " ('*PrepNP', 'Punct'),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic 12##!'),\n", + " ('S', ('*VP', 'NP'), '4##jesteś 5##nikim'),\n", + " ('S', ('*VP', 'NP', 'PrepNP'), '8##mają 9##cię 10##za 11##nic')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! *PrepNP 0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Comp', ('3##iż',), '3##iż'),\n", + " ('*Comp', ('7##iż',), '7##iż'),\n", + " ('*Conj', ('6##,',), '6##,'),\n", + " ('*N', ('1##tym',), '1##tym'),\n", + " ('*N', ('11##nic',), '11##nic'),\n", + " ('*N', ('5##nikim',), '5##nikim'),\n", + " ('*N', ('9##cię',), '9##cię'),\n", + " ('*NP', ('*N',), '1##tym'),\n", + " ('*Prep', ('0##O',), '0##O'),\n", + " ('*Prep', ('10##za',), '10##za'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('*V', ('4##jesteś',), '4##jesteś'),\n", + " ('*V', ('8##mają',), '8##mają'),\n", + " ('*VP', ('*V',), '4##jesteś'),\n", + " ('*VP', ('*V',), '8##mają'),\n", + " ('CP', ('*Comp', 'S'), '7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('CP',\n", + " ('CP', '*Conj', 'CP'),\n", + " '2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('CP', ('Punct', '*Comp', 'S'), '2##, 3##iż 4##jesteś 5##nikim'),\n", + " ('NP', ('*N',), '11##nic'),\n", + " ('NP', ('*N',), '5##nikim'),\n", + " ('NP', ('*N',), '9##cię'),\n", + " ('NP',\n", + " ('*NP', 'CP'),\n", + " '1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n", + " ('PrepNP', ('*Prep', 'NP'), '10##za 
11##nic'),\n", + " ('Punct', ('12##!',), '12##!'),\n", + " ('Punct', ('2##,',), '2##,'),\n", + " ('ROOT',\n", + " ('*PrepNP', 'Punct'),\n", + " '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic 12##!'),\n", + " ('S', ('*VP', 'NP'), '4##jesteś 5##nikim'),\n", + " ('S', ('*VP', 'NP', 'PrepNP'), '8##mają 9##cię 10##za 11##nic')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! *NP 0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adj', ('1##małe',), '1##małe'),\n", + " ('*N', ('2##groszki',), '2##groszki'),\n", + " ('*N', ('4##strąku',), '4##strąku'),\n", + " ('*N', ('6##tunelu',), '6##tunelu'),\n", + " ('*N', ('7##miłości',), '7##miłości'),\n", + " ('*NP', ('*N',), '2##groszki'),\n", + " ('*NP', ('*N',), '6##tunelu'),\n", + " ('*NP',\n", + " ('*NP',),\n", + " '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n", + " ('*NP',\n", + " ('*NumP', 'NP'),\n", + " '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n", + " ('*Num', ('0##Cztery',), '0##Cztery'),\n", + " ('*NumP', ('*Num',), '0##Cztery'),\n", + " ('*Prep', ('3##w',), '3##w'),\n", + " ('*Prep', ('5##w',), '5##w'),\n", + " ('AdjP', ('*Adj',), '1##małe'),\n", + " ('NP', ('*N',), '4##strąku'),\n", + " ('NP', ('*N',), '7##miłości'),\n", + " ('NP', ('*NP', 'NP'), '6##tunelu 7##miłości'),\n", + " ('NP',\n", + " ('AdjP', '*NP', 'PrepNP', 'PrepNP'),\n", + " '1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n", + " ('PrepNP', ('*Prep', 'NP'), '3##w 4##strąku'),\n", + " ('PrepNP', ('*Prep', 'NP'), '5##w 6##tunelu 7##miłości'),\n", + " ('Punct', ('8##.',), '8##.'),\n", + " ('ROOT',\n", + " ('*NP', 'Punct'),\n", + " '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości 8##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + 
"name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! *PrepNP 0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adv', ('3##gdy',), '3##gdy'),\n", + " ('*N', ('1##chwili',), '1##chwili'),\n", + " ('*N', ('7##Alpy',), '7##Alpy'),\n", + " ('*N', ('8##słonie',), '8##słonie'),\n", + " ('*N', ('9##Hannibala',), '9##Hannibala'),\n", + " ('*NP', ('*N',), '1##chwili'),\n", + " ('*NP', ('*N',), '8##słonie'),\n", + " ('*Prep', ('0##W',), '0##W'),\n", + " ('*Prep', ('6##przez',), '6##przez'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*S',\n", + " ('AdvP', '*VP', 'PrepNP', 'NP'),\n", + " '3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*V', ('4##przeprowadzał', '5##em'), '4##przeprowadzał 5##em'),\n", + " ('*VP', ('*V',), '4##przeprowadzał 5##em'),\n", + " ('AdvP', ('*Adv',), '3##gdy'),\n", + " ('CP',\n", + " ('Punct', '*S'),\n", + " '2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('NP', ('*N',), '7##Alpy'),\n", + " ('NP', ('*N',), '9##Hannibala'),\n", + " ('NP',\n", + " ('*NP', 'CP'),\n", + " '1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('NP', ('*NP', 'NP'), '8##słonie 9##Hannibala'),\n", + " ('PrepNP', ('*Prep', 'NP'), '6##przez 7##Alpy'),\n", + " ('Punct', ('10##.',), '10##.'),\n", + " ('Punct', ('2##,',), '2##,'),\n", + " ('ROOT',\n", + " ('*PrepNP', 'Punct'),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala 10##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + 
"text": [ + "!!!!!!!!!!!!!!! *PrepNP 0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adv', ('3##gdy',), '3##gdy'),\n", + " ('*N', ('1##chwili',), '1##chwili'),\n", + " ('*N', ('7##Alpy',), '7##Alpy'),\n", + " ('*N', ('8##słonie',), '8##słonie'),\n", + " ('*N', ('9##Hannibala',), '9##Hannibala'),\n", + " ('*NP', ('*N',), '1##chwili'),\n", + " ('*NP', ('*N',), '8##słonie'),\n", + " ('*Prep', ('0##W',), '0##W'),\n", + " ('*Prep', ('6##przez',), '6##przez'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*S',\n", + " ('AdvP', '*VP', 'PrepNP', 'NP'),\n", + " '3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('*V', ('4##przeprowadzał', '5##em'), '4##przeprowadzał 5##em'),\n", + " ('*VP', ('*V',), '4##przeprowadzał 5##em'),\n", + " ('AdvP', ('*Adv',), '3##gdy'),\n", + " ('CP',\n", + " ('Punct', '*S'),\n", + " '2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('NP', ('*N',), '7##Alpy'),\n", + " ('NP', ('*N',), '9##Hannibala'),\n", + " ('NP',\n", + " ('*NP', 'CP'),\n", + " '1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n", + " ('NP', ('*NP', 'NP'), '8##słonie 9##Hannibala'),\n", + " ('PrepNP', ('*Prep', 'NP'), '6##przez 7##Alpy'),\n", + " ('Punct', ('10##.',), '10##.'),\n", + " ('Punct', ('2##,',), '2##,'),\n", + " ('ROOT',\n", + " ('*PrepNP', 'Punct'),\n", + " '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala 10##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! 
*PrepNP 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adj', ('2##roczną',), '2##roczną'),\n", + " ('*Adj', ('7##czternasty',), '7##czternasty'),\n", + " ('*N', ('3##misję',), '3##misję'),\n", + " ('*N', ('5##Tytana',), '5##Tytana'),\n", + " ('*N', ('8##księżyc',), '8##księżyc'),\n", + " ('*N', ('9##Saturna',), '9##Saturna'),\n", + " ('*NP', ('*N',), '3##misję'),\n", + " ('*NP', ('*N',), '5##Tytana'),\n", + " ('*NP', ('*N',), '8##księżyc'),\n", + " ('*Prep', ('1##na',), '1##na'),\n", + " ('*Prep', ('4##na',), '4##na'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('AdjP', ('*Adj',), '2##roczną'),\n", + " ('AdjP', ('*Adj',), '7##czternasty'),\n", + " ('NP', ('*N',), '9##Saturna'),\n", + " ('NP', ('*NP', 'NP'), '5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('NP',\n", + " ('AdjP', '*NP', 'PrepNP'),\n", + " '2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('NP',\n", + " ('Punct', 'AdjP', '*NP', 'NP'),\n", + " '6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('Punct', ('0##-',), '0##-'),\n", + " ('Punct', ('10##.',), '10##.'),\n", + " ('Punct', ('6##,',), '6##,'),\n", + " ('ROOT',\n", + " ('Punct', '*PrepNP', 'Punct'),\n", + " '0##- 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna 10##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "!!!!!!!!!!!!!!! 
*PrepNP 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna\n" + ] + }, + { + "data": { + "text/plain": [ + "{('*Adj', ('2##roczną',), '2##roczną'),\n", + " ('*Adj', ('7##czternasty',), '7##czternasty'),\n", + " ('*N', ('3##misję',), '3##misję'),\n", + " ('*N', ('5##Tytana',), '5##Tytana'),\n", + " ('*N', ('8##księżyc',), '8##księżyc'),\n", + " ('*N', ('9##Saturna',), '9##Saturna'),\n", + " ('*NP', ('*N',), '3##misję'),\n", + " ('*NP', ('*N',), '5##Tytana'),\n", + " ('*NP', ('*N',), '8##księżyc'),\n", + " ('*Prep', ('1##na',), '1##na'),\n", + " ('*Prep', ('4##na',), '4##na'),\n", + " ('*PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('*PrepNP',\n", + " ('*PrepNP',),\n", + " '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('AdjP', ('*Adj',), '2##roczną'),\n", + " ('AdjP', ('*Adj',), '7##czternasty'),\n", + " ('NP', ('*N',), '9##Saturna'),\n", + " ('NP', ('*NP', 'NP'), '5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('NP',\n", + " ('AdjP', '*NP', 'PrepNP'),\n", + " '2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('NP',\n", + " ('Punct', 'AdjP', '*NP', 'NP'),\n", + " '6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('PrepNP',\n", + " ('*Prep', 'NP'),\n", + " '4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n", + " ('Punct', ('0##-',), '0##-'),\n", + " ('Punct', ('10##.',), '10##.'),\n", + " ('Punct', ('6##,',), '6##,'),\n", + " ('ROOT',\n", + " ('Punct', '*PrepNP', 'Punct'),\n", + " '0##- 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna 10##.')}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "evaluation_val, errors_val = eval_trees(val_trees, val_pred_trees)\n", + "evaluation_test, errors_test = eval_trees(test_trees, test_pred_trees)" + ] + }, + { + "cell_type": 
"code", + "execution_count": 56, + "id": "65af3522", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "DEV:\n", + "precision: 0.974400637684714\n", + "recall: 0.9742960930674555\n", + "f1: 0.9743483625717548\n" + ] + } + ], + "source": [ + "tp, fp, fn = list(map(sum, zip(*evaluation_val)))\n", + "p, r = tp / (tp + fp), tp / (tp + fn)\n", + "f1 = 2 * tp / (2 * tp + fp + fn)\n", + "print('DEV:')\n", + "print('precision: ', p)\n", + "print('recall: ', r)\n", + "print('f1: ', f1)" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "id": "8e0f3f93", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "TEST:\n", + "precision: 0.9774147274466051\n", + "recall: 0.9775082092645137\n", + "f1: 0.9774614661204711\n" + ] + } + ], + "source": [ + "tp, fp, fn = list(map(sum, zip(*evaluation_test)))\n", + "p, r = tp / (tp + fp), tp / (tp + fn)\n", + "f1 = 2 * tp / (2 * tp + fp + fn)\n", + "print('TEST:')\n", + "print('precision: ', p)\n", + "print('recall: ', r)\n", + "print('f1: ', f1)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "302b2333", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "torch_benepar", + "language": "python", + "name": "torch_benepar" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.6" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/COMBO/DataPreparation.ipynb a/COMBO/DataPreparation.ipynb new file mode 100644 index 0000000..fde3938 --- /dev/null +++ a/COMBO/DataPreparation.ipynb @@ -0,0 +1,213 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 46, + "id": "5cd26f6f", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + 
"\n", + "from datasets import load_dataset\n", + "\n", + "from IPython.display import display" + ] + }, + { + "cell_type": "code", + "execution_count": 47, + "id": "fecef4af", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Found cached dataset pdb_c_beta (/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "1c89c7103bba4347a3fa7d23cac42cfe", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/3 [00:00<?, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "pdbc_dataset = load_dataset('../pdb_c_beta')" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "id": "23da801f", + "metadata": {}, + "outputs": [], + "source": [ + "CONLLU_DIR = 'connlu'\n", + "! rm -r {CONLLU_DIR}\n", + "! mkdir {CONLLU_DIR}" + ] + }, + { + "cell_type": "code", + "execution_count": 50, + "id": "91fb3bf3", + "metadata": {}, + "outputs": [], + "source": [ + "import sys\n", + "sys.path.append('../')\n", + "from neural_parser.hybrid_tree_utils import tree_from_dataset_instance" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "id": "c105feff", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "train\n", + " connlu/pdbc-train.conllu\n", + " 17659\n", + " connlu/pdbc-cont-train.conllu\n", + " 15903\n", + "validation\n", + " connlu/pdbc-validation.conllu\n", + " 2211\n", + " connlu/pdbc-cont-validation.conllu\n", + " 1980\n", + "test\n", + " connlu/pdbc-test.conllu\n", + " 2205\n", + " connlu/pdbc-cont-test.conllu\n", + " 1990\n" + ] + } + ], + "source": [ + "features = pdbc_dataset['train'].features\n", + "\n", + "for part, dataset in pdbc_dataset.items():\n", + " print(part)\n", + " s_cont, s_all = [], [] \n", + " for sentence in 
dataset:\n", + " # TODO! check if discont\n", + " tokens = sentence['tokens']\n", + " lemmas = sentence['lemmas']\n", + " heads = sentence['heads']\n", + " heads = [h + 1 if h is not None else 0 for i, h in enumerate(heads)]\n", + " deprels = [features['deprels'].feature.int2str(d) for d in sentence['deprels']]\n", + " deprels = ['root' if deprel == 'ROOT' else deprel for deprel in deprels]\n", + " rows = [f'# text = {\" \".join(tokens)}'] + [\n", + " f'{i + 1}\\t{t}\\t{l}\\t_\\t_\\t_\\t{h}\\t{d}\\t{h}:{d}\\t_'\n", + " for i, (t, l, h, d) in enumerate(zip(tokens, lemmas, heads, deprels))\n", + " ]\n", + " s_all.append(rows)\n", + " if tree_from_dataset_instance(sentence, features).is_continuous():\n", + " s_cont.append(rows)\n", + " f_all = os.path.join(CONLLU_DIR, f'pdbc-{part}.conllu')\n", + " f_cont = os.path.join(CONLLU_DIR, f'pdbc-cont-{part}.conllu')\n", + " with open(f_all, 'w') as f:\n", + " print(' ', f_all)\n", + " print(' ', len(s_all))\n", + " for rows in s_all:\n", + " print('\\n'.join(rows), end='\\n\\n', file=f)\n", + " with open(f_cont, 'w') as f:\n", + " print(' ', f_cont)\n", + " print(' ', len(s_cont))\n", + " for rows in s_cont:\n", + " print('\\n'.join(rows), end='\\n\\n', file=f)" + ] + }, + { + "cell_type": "code", + "execution_count": 61, + "id": "c849233c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " 32509 319813 1398303 connlu/pdbc-cont-test.conllu\n", + " 32509 319813 1198902 connlu/pdbc-cont-test-pred.conllu\n", + " 271337 2682725 11781617 connlu/pdbc-cont-train.conllu\n", + " 33491 330792 1452373 connlu/pdbc-cont-validation.conllu\n", + " 33491 330792 1244192 connlu/pdbc-cont-validation-pred.conllu\n", + " 37754 373431 1639937 connlu/pdbc-test.conllu\n", + " 37754 373431 1406776 connlu/pdbc-test-pred.conllu\n", + " 315364 3133712 13808053 connlu/pdbc-train.conllu\n", + " 38987 386865 1704685 connlu/pdbc-validation.conllu\n", + " 38987 386865 1461922 
connlu/pdbc-validation-pred.conllu\n", + " 872183 8638239 37096760 total\n" + ] + } + ], + "source": [ + "! wc {CONLLU_DIR}/*.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "id": "6b571716", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Skośnooka dziewczynka trzyma w rękach drewniane pałeczki , a przed nią znajdują się naczynia kuchenne .\r\n", + "1\tSkośnooka\tskośnooki\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n", + "2\tdziewczynka\tdziewczynka\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "3\ttrzyma\ttrzymać\t_\t_\t_\t9\tconjunct\t9:conjunct\t_\r\n", + "4\tw\tw\t_\t_\t_\t3\tadjunct_locat\t3:adjunct_locat\t_\r\n", + "5\trękach\tręka\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n", + "6\tdrewniane\tdrewniany\t_\t_\t_\t7\tadjunct\t7:adjunct\t_\r\n", + "7\tpałeczki\tpałeczka\t_\t_\t_\t3\tobj\t3:obj\t_\r\n", + "8\t,\t,\t_\t_\t_\t9\tpunct\t9:punct\t_\r\n", + "9\ta\ta\t_\t_\t_\t0\troot\t0:root\t_\r\n" + ] + } + ], + "source": [ + "! head {CONLLU_DIR}/pdbc-train.conllu" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "TF_zajecia", + "language": "python", + "name": "tf_zajecia" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.6" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/COMBO/ParseValAndTrain.ipynb a/COMBO/ParseValAndTrain.ipynb new file mode 100644 index 0000000..a8e8ad0 --- /dev/null +++ a/COMBO/ParseValAndTrain.ipynb @@ -0,0 +1,1213 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "aabfb24b", + "metadata": {}, + "outputs": [], + "source": [ + "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'" + ] + }, + { + "cell_type": "markdown", + "id": "787fff78", + "metadata": {}, + "source": [ + "Main model" + ] + }, + { + "cell_type": 
"code", + "execution_count": 2, + "id": "1d9daaa9", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:49:31.448594 140072765682752 archival.py:184] loading archive file model-pdbc/model.tar.gz\n", + "I0407 10:49:31.449148 140072765682752 archival.py:263] extracting archive file model-pdbc/model.tar.gz to temp dir /tmp/tmp_htckuhc\n", + "I0407 10:49:48.075045 140072765682752 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:49:48.075561 140072765682752 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:49:48.075693 140072765682752 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:49:48.075764 140072765682752 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:49:48.075832 140072765682752 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:49:48.075901 140072765682752 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:49:48.076193 140072765682752 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:49:48.076388 140072765682752 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:49:48.076621 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:48.076697 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:48.076790 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:48.076939 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:48.077063 140072765682752 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 10:49:48.077118 140072765682752 params.py:248] 
dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:49:48.077185 140072765682752 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:49:48.077238 140072765682752 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:49:48.077383 140072765682752 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:49:48.077555 140072765682752 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:49:48.077628 140072765682752 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:49:48.077702 140072765682752 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:49:48.077838 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:49:48.078031 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:49:48.078231 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:48.078300 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:48.078378 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:48.078666 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:48.078786 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:49:48.078862 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:49:48.078916 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:49:48.078969 140072765682752 
params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:49:48.079103 140072765682752 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:49:48.079328 140072765682752 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:49:48.079406 140072765682752 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:49:48.079461 140072765682752 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:49:48.079525 140072765682752 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:49:48.079628 140072765682752 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:49:51.185825 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:49:51.186234 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:49:51.186336 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:49:51.186398 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:49:51.186465 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:49:51.186517 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:49:51.186579 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:49:51.186631 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:49:51.186791 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:49:51.186975 
140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:49:51.187041 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:49:51.187107 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:49:51.187170 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:49:51.187220 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:49:51.187275 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:49:51.187334 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:49:51.187556 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:49:51.187731 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:49:51.187935 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:51.187995 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:51.188073 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:51.188217 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:51.188334 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:49:51.188398 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:49:51.188460 140072765682752 params.py:248] 
dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:49:51.188522 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:49:51.188614 140072765682752 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:49:51.188712 140072765682752 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:49:51.188802 140072765682752 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:49:51.188952 140072765682752 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:49:51.189191 140072765682752 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:49:51.189266 140072765682752 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:49:51.189324 140072765682752 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:49:51.189382 140072765682752 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:49:51.189436 140072765682752 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:49:51.189675 140072765682752 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:49:51.189843 140072765682752 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:49:51.190060 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:51.190128 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:51.190197 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:51.190324 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:51.190443 140072765682752 params.py:248] dataset_reader.token_indexers.char.start_tokens 
= None\n", + "I0407 10:49:51.190508 140072765682752 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:49:51.190564 140072765682752 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:49:51.190627 140072765682752 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:49:51.190772 140072765682752 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:49:51.190932 140072765682752 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:49:51.191003 140072765682752 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:49:51.191065 140072765682752 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:49:51.191206 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:49:51.191369 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:49:51.191561 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:51.191629 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:51.191706 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:51.191827 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:51.191938 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:49:51.191999 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:49:51.192067 140072765682752 params.py:248] 
dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:49:51.192142 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:49:51.192281 140072765682752 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:49:51.192501 140072765682752 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:49:51.192575 140072765682752 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:49:51.192638 140072765682752 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:49:51.192698 140072765682752 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:49:51.192795 140072765682752 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:49:51.194080 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:49:51.194318 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:49:51.194404 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:49:51.194471 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:49:51.194532 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:49:51.194586 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:49:51.194648 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:49:51.194708 140072765682752 params.py:248] 
dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:49:51.194854 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:49:51.195033 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:49:51.195105 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:49:51.195167 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:49:51.195222 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:49:51.195280 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:49:51.195338 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:49:51.195398 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:49:51.195601 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:49:51.195774 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:49:51.195971 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:49:51.196039 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:49:51.196113 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:49:51.196244 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:49:51.196364 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = 
None\n", + "I0407 10:49:51.196430 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:49:51.196492 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:49:51.196552 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:49:51.196640 140072765682752 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:49:51.196732 140072765682752 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:49:51.196815 140072765682752 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:49:51.197346 140072765682752 params.py:248] vocabulary.type = from_instances_extended\n", + "I0407 10:49:51.197421 140072765682752 vocabulary.py:323] Loading token dictionary from /tmp/tmp_htckuhc/vocabulary.\n", + "I0407 10:49:51.197736 140072765682752 filelock.py:254] Lock 140069359832176 acquired on /tmp/tmp_htckuhc/vocabulary/.lock\n", + "I0407 10:49:51.198361 140072765682752 filelock.py:317] Lock 140069359832176 released on /tmp/tmp_htckuhc/vocabulary/.lock\n", + "I0407 10:49:51.198865 140072765682752 params.py:248] model.type = semantic_multitask\n", + "I0407 10:49:51.199399 140072765682752 params.py:248] model.text_field_embedder.type = basic\n", + "I0407 10:49:51.199762 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "I0407 10:49:51.199955 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "I0407 10:49:51.200206 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "I0407 10:49:51.200286 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "I0407 10:49:51.200380 140072765682752 params.py:248] 
model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n", + "I0407 10:49:51.200467 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "I0407 10:49:51.200556 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "I0407 10:49:51.200649 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "I0407 10:49:51.200745 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "I0407 10:49:51.200886 140072765682752 params.py:248] type = relu\n", + "I0407 10:49:51.201073 140072765682752 params.py:248] type = relu\n", + "I0407 10:49:51.201222 140072765682752 params.py:248] type = linear\n", + "I0407 10:49:51.208180 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "I0407 10:49:51.208718 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "I0407 10:49:51.208946 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:49:51.209028 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "I0407 10:49:51.209110 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f646dd85280>\n", + "I0407 10:49:51.209182 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "I0407 10:49:51.209239 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "I0407 10:49:51.209295 140072765682752 
params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n", + "I0407 10:49:51.209401 140072765682752 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:49:51.209471 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n", + "I0407 10:49:58.747374 140072765682752 params.py:248] model.seq_encoder.type = combo_encoder\n", + "I0407 10:49:58.747746 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n", + "I0407 10:49:58.747819 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "I0407 10:49:58.747869 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "I0407 10:49:58.747919 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "I0407 10:49:58.747966 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "I0407 10:49:58.748013 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n", + "I0407 10:49:59.084017 140072765682752 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n", + "I0407 10:49:59.084280 140072765682752 params.py:248] model.use_sample_weight = True\n", + "I0407 10:49:59.084377 140072765682752 params.py:248] model.lemmatizer = None\n", + "I0407 10:49:59.084436 140072765682752 params.py:248] model.upos_tagger = None\n", + "I0407 10:49:59.084487 140072765682752 params.py:248] model.xpos_tagger = None\n", + "I0407 10:49:59.084537 140072765682752 params.py:248] model.semantic_relation = None\n", + "I0407 10:49:59.084585 140072765682752 params.py:248] model.morphological_feat = None\n", + "I0407 10:49:59.084832 140072765682752 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n", + "I0407 10:49:59.085025 140072765682752 params.py:248] 
model.dependency_relation.vocab_namespace = deprel_labels\n", + "I0407 10:49:59.085301 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + "I0407 10:49:59.085365 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "I0407 10:49:59.085421 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "I0407 10:49:59.085520 140072765682752 params.py:248] type = tanh\n", + "I0407 10:49:59.085608 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "I0407 10:49:59.089095 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "I0407 10:49:59.089183 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "I0407 10:49:59.089244 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "I0407 10:49:59.089346 140072765682752 params.py:248] type = tanh\n", + "I0407 10:49:59.089423 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "I0407 10:49:59.092701 140072765682752 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "I0407 10:49:59.092917 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n", + "I0407 10:49:59.092972 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n", + "I0407 10:49:59.093022 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n", + "I0407 10:49:59.093108 140072765682752 params.py:248] type = tanh\n", + "I0407 10:49:59.093183 140072765682752 params.py:248] 
model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "I0407 10:49:59.094336 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "I0407 10:49:59.094411 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "I0407 10:49:59.094463 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "I0407 10:49:59.094551 140072765682752 params.py:248] type = tanh\n", + "I0407 10:49:59.094618 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "I0407 10:49:59.095806 140072765682752 params.py:248] model.enhanced_dependency_relation = None\n", + "I0407 10:49:59.096206 140072765682752 params.py:248] model.regularizer.regexes.0.1.type = l2\n", + "I0407 10:49:59.096345 140072765682752 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n", + "I0407 10:49:59.096471 140072765682752 params.py:248] model.regularizer.regexes.1.1.type = l2\n", + "I0407 10:49:59.096584 140072765682752 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n", + "I0407 10:49:59.096696 140072765682752 params.py:248] model.regularizer.regexes.2.1.type = l2\n", + "I0407 10:49:59.096809 140072765682752 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n", + "I0407 10:49:59.096917 140072765682752 params.py:248] model.regularizer.regexes.3.1.type = l2\n", + "I0407 10:49:59.097025 140072765682752 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:50:01.854557 140072765682752 archival.py:211] removing temporary unarchived model dir at /tmp/tmp_htckuhc\n", + "reading instances: 2211it [01:52, 19.69it/s]\n" + ] + } + ], + "source": [ + "! 
{COMBO} --mode predict \\\n", + " --cuda_device 0 \\\n", + " --model_path model-pdbc/model.tar.gz \\\n", + " --input_file connlu/pdbc-validation.conllu \\\n", + " --output_file connlu/pdbc-validation-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "11f1b7b1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n", + "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n", + "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n", + "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n", + "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n", + "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n", + "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n", + "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n", + "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n" + ] + } + ], + "source": [ + "! head connlu/pdbc-validation.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "8fa72124", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n", + "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n", + "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n", + "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n", + "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n", + "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n", + "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n", + "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n", + "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n" + ] + } + ], + "source": [ + "! 
head connlu/pdbc-validation-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "dde6dd31", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:52:00.220404 139754138821696 archival.py:184] loading archive file model-pdbc/model.tar.gz\n", + "I0407 10:52:00.221079 139754138821696 archival.py:263] extracting archive file model-pdbc/model.tar.gz to temp dir /tmp/tmp2jhqu3i6\n", + "I0407 10:52:16.996590 139754138821696 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:52:16.997079 139754138821696 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:52:16.997236 139754138821696 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:52:16.997326 139754138821696 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:52:16.997391 139754138821696 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:52:16.997456 139754138821696 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:52:16.997756 139754138821696 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:52:16.997950 139754138821696 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:52:16.998211 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:16.998285 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:16.998367 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:16.998522 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:16.998643 139754138821696 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 
10:52:16.998707 139754138821696 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:52:16.998770 139754138821696 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:52:16.998831 139754138821696 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:52:16.998980 139754138821696 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:52:16.999143 139754138821696 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:52:16.999213 139754138821696 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:52:16.999269 139754138821696 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:52:16.999412 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:52:16.999578 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:52:16.999774 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:16.999842 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:16.999923 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:17.000045 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:17.000156 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:52:17.000220 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:52:17.000282 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + 
"I0407 10:52:17.000344 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:52:17.000521 139754138821696 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:52:17.000770 139754138821696 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:52:17.000865 139754138821696 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:52:17.000947 139754138821696 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:52:17.001028 139754138821696 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:52:17.001172 139754138821696 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:52:20.459573 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:52:20.459947 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:52:20.460046 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:52:20.460119 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:52:20.460172 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:52:20.460235 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:52:20.460288 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:52:20.460351 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:52:20.460508 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.type = 
single_id\n", + "I0407 10:52:20.460695 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:52:20.460773 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:52:20.460840 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:52:20.460901 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:52:20.460962 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:52:20.461021 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:52:20.461083 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:52:20.461313 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:52:20.461496 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:52:20.461706 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:20.461774 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:20.461853 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:20.462028 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:20.462157 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:52:20.462226 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:52:20.462283 139754138821696 
params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:52:20.462336 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:52:20.462417 139754138821696 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:52:20.462514 139754138821696 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:52:20.462607 139754138821696 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:52:20.462767 139754138821696 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:52:20.463083 139754138821696 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:52:20.463172 139754138821696 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:52:20.463237 139754138821696 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:52:20.463301 139754138821696 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:52:20.463361 139754138821696 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:52:20.463605 139754138821696 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:52:20.463779 139754138821696 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:52:20.463980 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:20.464051 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:20.464129 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:20.464254 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:20.464366 139754138821696 params.py:248] 
dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 10:52:20.464429 139754138821696 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:52:20.464490 139754138821696 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:52:20.464552 139754138821696 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:52:20.464691 139754138821696 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:52:20.464847 139754138821696 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:52:20.464918 139754138821696 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:52:20.464980 139754138821696 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:52:20.465120 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:52:20.465285 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:52:20.465479 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:20.465544 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:20.465618 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:20.465741 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:20.465851 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:52:20.465914 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:52:20.466024 139754138821696 params.py:248] 
dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:52:20.466112 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:52:20.466268 139754138821696 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:52:20.466485 139754138821696 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:52:20.466559 139754138821696 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:52:20.466621 139754138821696 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:52:20.466682 139754138821696 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:52:20.466777 139754138821696 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:52:20.468071 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:52:20.468319 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:52:20.468404 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:52:20.468464 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:52:20.468523 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:52:20.468573 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:52:20.468636 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:52:20.468697 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:52:20.468832 139754138821696 
params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:52:20.469012 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:52:20.469086 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:52:20.469144 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:52:20.469196 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:52:20.469256 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:52:20.469320 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:52:20.469382 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:52:20.469586 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:52:20.469758 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:52:20.469957 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:52:20.470050 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:52:20.470128 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:52:20.470261 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:52:20.470381 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:52:20.470448 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = 
None\n", + "I0407 10:52:20.470509 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:52:20.470579 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:52:20.470668 139754138821696 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:52:20.470764 139754138821696 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:52:20.470849 139754138821696 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:52:20.471387 139754138821696 params.py:248] vocabulary.type = from_instances_extended\n", + "I0407 10:52:20.471461 139754138821696 vocabulary.py:323] Loading token dictionary from /tmp/tmp2jhqu3i6/vocabulary.\n", + "I0407 10:52:20.471798 139754138821696 filelock.py:254] Lock 139750732975216 acquired on /tmp/tmp2jhqu3i6/vocabulary/.lock\n", + "I0407 10:52:20.472387 139754138821696 filelock.py:317] Lock 139750732975216 released on /tmp/tmp2jhqu3i6/vocabulary/.lock\n", + "I0407 10:52:20.472922 139754138821696 params.py:248] model.type = semantic_multitask\n", + "I0407 10:52:20.473455 139754138821696 params.py:248] model.text_field_embedder.type = basic\n", + "I0407 10:52:20.473808 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "I0407 10:52:20.474030 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "I0407 10:52:20.474286 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "I0407 10:52:20.474377 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "I0407 10:52:20.474480 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n", + "I0407 10:52:20.474578 139754138821696 params.py:248] 
model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "I0407 10:52:20.474673 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "I0407 10:52:20.474768 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "I0407 10:52:20.474864 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "I0407 10:52:20.475005 139754138821696 params.py:248] type = relu\n", + "I0407 10:52:20.475197 139754138821696 params.py:248] type = relu\n", + "I0407 10:52:20.475347 139754138821696 params.py:248] type = linear\n", + "I0407 10:52:20.481609 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "I0407 10:52:20.482178 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "I0407 10:52:20.482446 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:52:20.482533 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "I0407 10:52:20.482632 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f1a3e346280>\n", + "I0407 10:52:20.482703 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "I0407 10:52:20.482769 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "I0407 10:52:20.482831 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n", + "I0407 10:52:20.482933 139754138821696 params.py:384] 
model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:52:20.483003 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:52:28.699278 139754138821696 params.py:248] model.seq_encoder.type = combo_encoder\n", + "I0407 10:52:28.699747 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n", + "I0407 10:52:28.699841 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "I0407 10:52:28.699910 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "I0407 10:52:28.699976 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "I0407 10:52:28.700042 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "I0407 10:52:28.700106 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n", + "I0407 10:52:29.089101 139754138821696 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n", + "I0407 10:52:29.089426 139754138821696 params.py:248] model.use_sample_weight = True\n", + "I0407 10:52:29.089556 139754138821696 params.py:248] model.lemmatizer = None\n", + "I0407 10:52:29.089638 139754138821696 params.py:248] model.upos_tagger = None\n", + "I0407 10:52:29.089704 139754138821696 params.py:248] model.xpos_tagger = None\n", + "I0407 10:52:29.089766 139754138821696 params.py:248] model.semantic_relation = None\n", + "I0407 10:52:29.089827 139754138821696 params.py:248] model.morphological_feat = None\n", + "I0407 10:52:29.090160 139754138821696 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n", + "I0407 10:52:29.090409 139754138821696 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n", + "I0407 10:52:29.090762 
139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + "I0407 10:52:29.090843 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "I0407 10:52:29.090915 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "I0407 10:52:29.091041 139754138821696 params.py:248] type = tanh\n", + "I0407 10:52:29.091149 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "I0407 10:52:29.096003 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "I0407 10:52:29.096106 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "I0407 10:52:29.096185 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "I0407 10:52:29.096311 139754138821696 params.py:248] type = tanh\n", + "I0407 10:52:29.096407 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "I0407 10:52:29.101276 139754138821696 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "I0407 10:52:29.101581 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n", + "I0407 10:52:29.101692 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n", + "I0407 10:52:29.101771 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n", + "I0407 10:52:29.101904 139754138821696 params.py:248] type = tanh\n", + "I0407 10:52:29.102032 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "I0407 10:52:29.103649 
139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "I0407 10:52:29.103747 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "I0407 10:52:29.103819 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "I0407 10:52:29.103948 139754138821696 params.py:248] type = tanh\n", + "I0407 10:52:29.104044 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "I0407 10:52:29.105780 139754138821696 params.py:248] model.enhanced_dependency_relation = None\n", + "I0407 10:52:29.106371 139754138821696 params.py:248] model.regularizer.regexes.0.1.type = l2\n", + "I0407 10:52:29.106555 139754138821696 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n", + "I0407 10:52:29.106724 139754138821696 params.py:248] model.regularizer.regexes.1.1.type = l2\n", + "I0407 10:52:29.106879 139754138821696 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n", + "I0407 10:52:29.107035 139754138821696 params.py:248] model.regularizer.regexes.2.1.type = l2\n", + "I0407 10:52:29.107207 139754138821696 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n", + "I0407 10:52:29.107368 139754138821696 params.py:248] model.regularizer.regexes.3.1.type = l2\n", + "I0407 10:52:29.107544 139754138821696 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n", + "I0407 10:52:32.063793 139754138821696 archival.py:211] removing temporary unarchived model dir at /tmp/tmp2jhqu3i6\n", + "reading instances: 2205it [01:49, 20.15it/s]\n" + ] + } + ], + "source": [ + "! 
{COMBO} --mode predict \\\n", + " --cuda_device 0 \\\n", + " --model_path model-pdbc/model.tar.gz \\\n", + " --input_file connlu/pdbc-test.conllu \\\n", + " --output_file connlu/pdbc-test-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "13748ca1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n", + "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n", + "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n", + "4\tw\tw\t_\t_\t_\t3\tadjunct_adl\t3:adjunct_adl\t_\r\n", + "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n", + "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n", + "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n", + "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n", + "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n" + ] + } + ], + "source": [ + "! head connlu/pdbc-test.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "30021124", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n", + "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n", + "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n", + "4\tw\tw\t_\t_\t_\t3\tcomp\t3:adjunct_adl\t_\r\n", + "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n", + "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n", + "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n", + "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n", + "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n" + ] + } + ], + "source": [ + "! 
head connlu/pdbc-test-pred.conllu" + ] + }, + { + "cell_type": "markdown", + "id": "99359d8c", + "metadata": {}, + "source": [ + "Continuous-only model" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "30a66da6", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:54:27.401382 140321380496448 archival.py:184] loading archive file model-pdbc-cont/model.tar.gz\n", + "I0407 10:54:27.402150 140321380496448 archival.py:263] extracting archive file model-pdbc-cont/model.tar.gz to temp dir /tmp/tmpuvesoi4q\n", + "I0407 10:54:43.091615 140321380496448 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:54:43.092000 140321380496448 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:54:43.092082 140321380496448 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:54:43.092129 140321380496448 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:54:43.092173 140321380496448 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:54:43.092208 140321380496448 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:54:43.092409 140321380496448 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:54:43.092535 140321380496448 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:54:43.092682 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:43.092730 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:43.092786 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:43.092888 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + 
"I0407 10:54:43.092970 140321380496448 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 10:54:43.093014 140321380496448 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:54:43.093051 140321380496448 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:54:43.093093 140321380496448 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:54:43.093198 140321380496448 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:54:43.093306 140321380496448 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:54:43.093353 140321380496448 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:54:43.093388 140321380496448 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:54:43.093482 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:54:43.093593 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:54:43.093723 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:43.093769 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:43.093816 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:43.093899 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:54:43.093993 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:54:43.094043 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + 
"I0407 10:54:43.094079 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:54:43.094121 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:54:43.094226 140321380496448 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:54:43.094377 140321380496448 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:54:43.094430 140321380496448 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:54:43.094474 140321380496448 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:54:43.094522 140321380496448 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:54:43.094592 140321380496448 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:54:45.858621 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:54:45.858990 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:54:45.859087 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:54:45.859157 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:54:45.859210 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:54:45.859268 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:54:45.859321 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:54:45.859382 140321380496448 params.py:248] 
dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:54:45.859541 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:54:45.859729 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:54:45.859802 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:54:45.859875 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:54:45.859931 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:54:45.859991 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:54:45.860045 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:54:45.860103 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:54:45.860332 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:54:45.860523 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:54:45.860739 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:45.860809 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:45.860888 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:45.861032 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:54:45.861149 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = 
None\n", + "I0407 10:54:45.861213 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:54:45.861277 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:54:45.861337 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:54:45.861427 140321380496448 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:54:45.861522 140321380496448 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:54:45.861611 140321380496448 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:54:45.861762 140321380496448 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:54:45.862029 140321380496448 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:54:45.862116 140321380496448 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:54:45.862177 140321380496448 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:54:45.862234 140321380496448 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:54:45.862295 140321380496448 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:54:45.862535 140321380496448 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:54:45.862701 140321380496448 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:54:45.862900 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:45.862966 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:45.863043 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:45.863168 140321380496448 params.py:248] 
dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:54:45.863281 140321380496448 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 10:54:45.863344 140321380496448 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:54:45.863406 140321380496448 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:54:45.863469 140321380496448 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:54:45.863596 140321380496448 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:54:45.863752 140321380496448 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:54:45.863821 140321380496448 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:54:45.863883 140321380496448 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:54:45.864030 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:54:45.864196 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:54:45.864392 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:45.864460 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:45.864540 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:45.864660 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:54:45.864772 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:54:45.864835 
140321380496448 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:54:45.864896 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:54:45.864965 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:54:45.865104 140321380496448 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:54:45.865323 140321380496448 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:54:45.865396 140321380496448 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:54:45.865460 140321380496448 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:54:45.865518 140321380496448 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:54:45.865614 140321380496448 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:54:45.866884 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:54:45.867116 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:54:45.867190 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:54:45.867258 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:54:45.867316 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:54:45.867376 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:54:45.867437 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:54:45.867497 
140321380496448 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:54:45.867640 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:54:45.867815 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:54:45.867887 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:54:45.867951 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:54:45.868006 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:54:45.868063 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:54:45.868122 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:54:45.868181 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:54:45.868388 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:54:45.868559 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:54:45.868757 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:54:45.868824 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:54:45.868897 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:54:45.869028 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:54:45.869139 140321380496448 params.py:248] 
dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:54:45.869202 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:54:45.869256 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:54:45.869315 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:54:45.869398 140321380496448 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:54:45.869489 140321380496448 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:54:45.869572 140321380496448 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:54:45.870136 140321380496448 params.py:248] vocabulary.type = from_instances_extended\n", + "I0407 10:54:45.870218 140321380496448 vocabulary.py:323] Loading token dictionary from /tmp/tmpuvesoi4q/vocabulary.\n", + "I0407 10:54:45.870543 140321380496448 filelock.py:254] Lock 140317974842768 acquired on /tmp/tmpuvesoi4q/vocabulary/.lock\n", + "I0407 10:54:45.871132 140321380496448 filelock.py:317] Lock 140317974842768 released on /tmp/tmpuvesoi4q/vocabulary/.lock\n", + "I0407 10:54:45.871641 140321380496448 params.py:248] model.type = semantic_multitask\n", + "I0407 10:54:45.872183 140321380496448 params.py:248] model.text_field_embedder.type = basic\n", + "I0407 10:54:45.872548 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "I0407 10:54:45.872749 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "I0407 10:54:45.873004 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "I0407 10:54:45.873091 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "I0407 10:54:45.873195 140321380496448 
params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n", + "I0407 10:54:45.873291 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "I0407 10:54:45.873384 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "I0407 10:54:45.873478 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "I0407 10:54:45.873572 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "I0407 10:54:45.873714 140321380496448 params.py:248] type = relu\n", + "I0407 10:54:45.873904 140321380496448 params.py:248] type = relu\n", + "I0407 10:54:45.874098 140321380496448 params.py:248] type = linear\n", + "I0407 10:54:45.880232 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "I0407 10:54:45.880783 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "I0407 10:54:45.881011 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:54:45.881093 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "I0407 10:54:45.881184 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f9e50745280>\n", + "I0407 10:54:45.881261 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "I0407 10:54:45.881328 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "I0407 10:54:45.881389 
140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n", + "I0407 10:54:45.881492 140321380496448 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:54:45.881562 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:54:52.911276 140321380496448 params.py:248] model.seq_encoder.type = combo_encoder\n", + "I0407 10:54:52.911743 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n", + "I0407 10:54:52.911836 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "I0407 10:54:52.911902 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "I0407 10:54:52.911965 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "I0407 10:54:52.912029 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "I0407 10:54:52.912090 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n", + "I0407 10:54:53.279199 140321380496448 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n", + "I0407 10:54:53.279505 140321380496448 params.py:248] model.use_sample_weight = True\n", + "I0407 10:54:53.279624 140321380496448 params.py:248] model.lemmatizer = None\n", + "I0407 10:54:53.279695 140321380496448 params.py:248] model.upos_tagger = None\n", + "I0407 10:54:53.279757 140321380496448 params.py:248] model.xpos_tagger = None\n", + "I0407 10:54:53.279815 140321380496448 params.py:248] model.semantic_relation = None\n", + "I0407 10:54:53.279873 140321380496448 params.py:248] model.morphological_feat = None\n", + "I0407 10:54:53.280155 140321380496448 params.py:248] model.dependency_relation.type = 
combo_dependency_parsing_from_vocab\n", + "I0407 10:54:53.280393 140321380496448 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n", + "I0407 10:54:53.280741 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + "I0407 10:54:53.280819 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "I0407 10:54:53.280887 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "I0407 10:54:53.281012 140321380496448 params.py:248] type = tanh\n", + "I0407 10:54:53.281121 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "I0407 10:54:53.285843 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "I0407 10:54:53.286010 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "I0407 10:54:53.286088 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "I0407 10:54:53.286234 140321380496448 params.py:248] type = tanh\n", + "I0407 10:54:53.286334 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "I0407 10:54:53.290788 140321380496448 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "I0407 10:54:53.291093 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n", + "I0407 10:54:53.291184 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n", + "I0407 10:54:53.291281 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n", + "I0407 10:54:53.291444 140321380496448 
params.py:248] type = tanh\n", + "I0407 10:54:53.291567 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "I0407 10:54:53.293048 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "I0407 10:54:53.293147 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "I0407 10:54:53.293218 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "I0407 10:54:53.293342 140321380496448 params.py:248] type = tanh\n", + "I0407 10:54:53.293437 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "I0407 10:54:53.295091 140321380496448 params.py:248] model.enhanced_dependency_relation = None\n", + "I0407 10:54:53.295609 140321380496448 params.py:248] model.regularizer.regexes.0.1.type = l2\n", + "I0407 10:54:53.295784 140321380496448 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n", + "I0407 10:54:53.295953 140321380496448 params.py:248] model.regularizer.regexes.1.1.type = l2\n", + "I0407 10:54:53.296107 140321380496448 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n", + "I0407 10:54:53.296261 140321380496448 params.py:248] model.regularizer.regexes.2.1.type = l2\n", + "I0407 10:54:53.296412 140321380496448 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n", + "I0407 10:54:53.296564 140321380496448 params.py:248] model.regularizer.regexes.3.1.type = l2\n", + "I0407 10:54:53.296715 140321380496448 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n", + "I0407 10:54:56.194218 140321380496448 archival.py:211] removing temporary unarchived model dir at /tmp/tmpuvesoi4q\n", + "reading instances: 1980it [01:33, 21.15it/s]\n" + ] + } + ], + "source": [ + "! 
{COMBO} --mode predict \\\n", + " --cuda_device 0 \\\n", + " --model_path model-pdbc-cont/model.tar.gz \\\n", + " --input_file connlu/pdbc-cont-validation.conllu \\\n", + " --output_file connlu/pdbc-cont-validation-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "cfe7a3c4", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n", + "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n", + "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n", + "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n", + "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n", + "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n", + "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n", + "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n", + "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n" + ] + } + ], + "source": [ + "! head connlu/pdbc-cont-validation.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "7dba9571", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n", + "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n", + "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n", + "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n", + "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n", + "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n", + "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n", + "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n", + "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n" + ] + } + ], + "source": [ + "! 
head connlu/pdbc-cont-validation-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "679601c2", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:56:35.295660 140254825452608 archival.py:184] loading archive file model-pdbc-cont/model.tar.gz\n", + "I0407 10:56:35.296370 140254825452608 archival.py:263] extracting archive file model-pdbc-cont/model.tar.gz to temp dir /tmp/tmpdhtf4et1\n", + "I0407 10:56:52.876630 140254825452608 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:56:52.877122 140254825452608 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:56:52.877243 140254825452608 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:56:52.877313 140254825452608 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:56:52.877380 140254825452608 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:56:52.877446 140254825452608 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:56:52.877737 140254825452608 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:56:52.877938 140254825452608 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:56:52.878201 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:52.878276 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:52.878360 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:52.878507 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:52.878633 140254825452608 params.py:248] dataset_reader.token_indexers.char.start_tokens = 
None\n", + "I0407 10:56:52.878702 140254825452608 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:56:52.878761 140254825452608 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:56:52.878825 140254825452608 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:56:52.878969 140254825452608 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:56:52.879144 140254825452608 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:56:52.879218 140254825452608 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:56:52.879282 140254825452608 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:56:52.879426 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:56:52.879594 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:56:52.879792 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:52.879862 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:52.879944 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:52.880068 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:52.880184 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:56:52.880254 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:56:52.880316 140254825452608 params.py:248] 
dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:56:52.880378 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:56:52.880523 140254825452608 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:56:52.880748 140254825452608 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:56:52.880829 140254825452608 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:56:52.880893 140254825452608 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:56:52.880957 140254825452608 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:56:52.881069 140254825452608 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:56:55.893562 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:56:55.894115 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:56:55.894256 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:56:55.894343 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:56:55.894395 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:56:55.894465 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:56:55.894520 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:56:55.894590 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 10:56:55.894762 140254825452608 
params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:56:55.894958 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:56:55.895048 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:56:55.895111 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:56:55.895176 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:56:55.895228 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:56:55.895297 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:56:55.895349 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:56:55.895593 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:56:55.895786 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:56:55.896016 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:55.896095 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:55.896188 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:55.896353 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:55.896480 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:56:55.896552 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = 
None\n", + "I0407 10:56:55.896607 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:56:55.896675 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:56:55.896760 140254825452608 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:56:55.896864 140254825452608 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:56:55.896962 140254825452608 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:56:55.897153 140254825452608 params.py:248] dataset_reader.type = conllu\n", + "I0407 10:56:55.897414 140254825452608 params.py:248] dataset_reader.lazy = False\n", + "I0407 10:56:55.897499 140254825452608 params.py:248] dataset_reader.cache_directory = None\n", + "I0407 10:56:55.897570 140254825452608 params.py:248] dataset_reader.max_instances = None\n", + "I0407 10:56:55.897637 140254825452608 params.py:248] dataset_reader.manual_distributed_sharding = False\n", + "I0407 10:56:55.897707 140254825452608 params.py:248] dataset_reader.manual_multi_process_sharding = False\n", + "I0407 10:56:55.897995 140254825452608 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n", + "I0407 10:56:55.898183 140254825452608 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n", + "I0407 10:56:55.898398 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:55.898473 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:55.898542 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:55.898677 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:55.898799 
140254825452608 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n", + "I0407 10:56:55.898869 140254825452608 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n", + "I0407 10:56:55.898936 140254825452608 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n", + "I0407 10:56:55.898998 140254825452608 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "I0407 10:56:55.899158 140254825452608 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n", + "I0407 10:56:55.899337 140254825452608 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n", + "I0407 10:56:55.899414 140254825452608 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n", + "I0407 10:56:55.899485 140254825452608 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "I0407 10:56:55.899629 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "I0407 10:56:55.899797 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "I0407 10:56:55.899995 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:55.900055 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:55.900130 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:55.900250 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:55.900363 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n", + "I0407 10:56:55.900426 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n", + "I0407 10:56:55.900486 
140254825452608 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "I0407 10:56:55.900547 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "I0407 10:56:55.900689 140254825452608 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "I0407 10:56:55.900916 140254825452608 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "I0407 10:56:55.900995 140254825452608 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:56:55.901061 140254825452608 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n", + "I0407 10:56:55.901125 140254825452608 params.py:248] dataset_reader.token_indexers.token.max_length = None\n", + "I0407 10:56:55.901226 140254825452608 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:56:55.902561 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n", + "I0407 10:56:55.902824 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n", + "I0407 10:56:55.902909 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "I0407 10:56:55.902969 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n", + "I0407 10:56:55.903034 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n", + "I0407 10:56:55.903095 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "I0407 10:56:55.903159 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:56:55.903219 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "I0407 
10:56:55.903364 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n", + "I0407 10:56:55.903547 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "I0407 10:56:55.903621 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "I0407 10:56:55.903687 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "I0407 10:56:55.903748 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "I0407 10:56:55.903811 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "I0407 10:56:55.903868 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "I0407 10:56:55.903931 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "I0407 10:56:55.904146 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "I0407 10:56:55.904325 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "I0407 10:56:55.904539 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "I0407 10:56:55.904611 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "I0407 10:56:55.904691 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "I0407 10:56:55.904827 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "I0407 10:56:55.904946 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n", + "I0407 10:56:55.905013 140254825452608 params.py:248] 
dataset_reader.lemma_indexers.char.end_tokens = None\n", + "I0407 10:56:55.905084 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "I0407 10:56:55.905149 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "I0407 10:56:55.905237 140254825452608 params.py:248] dataset_reader.features = ['token', 'char']\n", + "I0407 10:56:55.905334 140254825452608 params.py:248] dataset_reader.targets = ['head', 'deprel']\n", + "I0407 10:56:55.905422 140254825452608 params.py:248] dataset_reader.use_sem = False\n", + "I0407 10:56:55.906047 140254825452608 params.py:248] vocabulary.type = from_instances_extended\n", + "I0407 10:56:55.906157 140254825452608 vocabulary.py:323] Loading token dictionary from /tmp/tmpdhtf4et1/vocabulary.\n", + "I0407 10:56:55.906635 140254825452608 filelock.py:254] Lock 140251419626896 acquired on /tmp/tmpdhtf4et1/vocabulary/.lock\n", + "I0407 10:56:55.907354 140254825452608 filelock.py:317] Lock 140251419626896 released on /tmp/tmpdhtf4et1/vocabulary/.lock\n", + "I0407 10:56:55.907914 140254825452608 params.py:248] model.type = semantic_multitask\n", + "I0407 10:56:55.908506 140254825452608 params.py:248] model.text_field_embedder.type = basic\n", + "I0407 10:56:55.908878 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "I0407 10:56:55.909080 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "I0407 10:56:55.909353 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "I0407 10:56:55.909446 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "I0407 10:56:55.909554 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n" + ] + }, + { + 
"name": "stdout", + "output_type": "stream", + "text": [ + "I0407 10:56:55.909654 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "I0407 10:56:55.909750 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "I0407 10:56:55.909847 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "I0407 10:56:55.909946 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "I0407 10:56:55.910176 140254825452608 params.py:248] type = relu\n", + "I0407 10:56:55.910410 140254825452608 params.py:248] type = relu\n", + "I0407 10:56:55.910567 140254825452608 params.py:248] type = linear\n", + "I0407 10:56:55.917278 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "I0407 10:56:55.917941 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "I0407 10:56:55.918267 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "I0407 10:56:55.918358 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "I0407 10:56:55.918458 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f8ed1745280>\n", + "I0407 10:56:55.918541 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "I0407 10:56:55.918609 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "I0407 10:56:55.918674 140254825452608 params.py:248] 
model.text_field_embedder.token_embedders.token.last_layer_only = True\n", + "I0407 10:56:55.918785 140254825452608 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "I0407 10:56:55.918858 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n", + "I0407 10:57:03.624983 140254825452608 params.py:248] model.seq_encoder.type = combo_encoder\n", + "I0407 10:57:03.625626 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n", + "I0407 10:57:03.625742 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "I0407 10:57:03.625796 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "I0407 10:57:03.625844 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "I0407 10:57:03.625942 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "I0407 10:57:03.626068 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n", + "I0407 10:57:03.933019 140254825452608 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n", + "I0407 10:57:03.933302 140254825452608 params.py:248] model.use_sample_weight = True\n", + "I0407 10:57:03.933391 140254825452608 params.py:248] model.lemmatizer = None\n", + "I0407 10:57:03.933440 140254825452608 params.py:248] model.upos_tagger = None\n", + "I0407 10:57:03.933486 140254825452608 params.py:248] model.xpos_tagger = None\n", + "I0407 10:57:03.933528 140254825452608 params.py:248] model.semantic_relation = None\n", + "I0407 10:57:03.933570 140254825452608 params.py:248] model.morphological_feat = None\n", + "I0407 10:57:03.933835 140254825452608 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n", + "I0407 10:57:03.934096 140254825452608 params.py:248] 
model.dependency_relation.vocab_namespace = deprel_labels\n", + "I0407 10:57:03.934389 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + "I0407 10:57:03.934459 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "I0407 10:57:03.934515 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "I0407 10:57:03.934614 140254825452608 params.py:248] type = tanh\n", + "I0407 10:57:03.934703 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "I0407 10:57:03.938141 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "I0407 10:57:03.938247 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "I0407 10:57:03.938306 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "I0407 10:57:03.938404 140254825452608 params.py:248] type = tanh\n", + "I0407 10:57:03.938489 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "I0407 10:57:03.941669 140254825452608 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "I0407 10:57:03.941908 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n", + "I0407 10:57:03.941985 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n", + "I0407 10:57:03.942037 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n", + "I0407 10:57:03.942123 140254825452608 params.py:248] type = tanh\n", + "I0407 10:57:03.942194 140254825452608 params.py:248] 
model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "I0407 10:57:03.943288 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "I0407 10:57:03.943376 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "I0407 10:57:03.943423 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "I0407 10:57:03.943510 140254825452608 params.py:248] type = tanh\n", + "I0407 10:57:03.943577 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "I0407 10:57:03.944838 140254825452608 params.py:248] model.enhanced_dependency_relation = None\n", + "I0407 10:57:03.945286 140254825452608 params.py:248] model.regularizer.regexes.0.1.type = l2\n", + "I0407 10:57:03.945443 140254825452608 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n", + "I0407 10:57:03.945568 140254825452608 params.py:248] model.regularizer.regexes.1.1.type = l2\n", + "I0407 10:57:03.945679 140254825452608 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n", + "I0407 10:57:03.945787 140254825452608 params.py:248] model.regularizer.regexes.2.1.type = l2\n", + "I0407 10:57:03.945892 140254825452608 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n", + "I0407 10:57:03.946047 140254825452608 params.py:248] model.regularizer.regexes.3.1.type = l2\n", + "I0407 10:57:03.946158 140254825452608 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n", + "I0407 10:57:06.549506 140254825452608 archival.py:211] removing temporary unarchived model dir at /tmp/tmpdhtf4et1\n", + "reading instances: 1990it [01:39, 20.00it/s]\n" + ] + } + ], + "source": [ + "! 
{COMBO} --mode predict \\\n", + " --cuda_device 0 \\\n", + " --model_path model-pdbc-cont/model.tar.gz \\\n", + " --input_file connlu/pdbc-cont-test.conllu \\\n", + " --output_file connlu/pdbc-cont-test-pred.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "ddc3986b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n", + "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n", + "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n", + "4\tw\tw\t_\t_\t_\t3\tadjunct_adl\t3:adjunct_adl\t_\r\n", + "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n", + "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n", + "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n", + "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n", + "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n" + ] + } + ], + "source": [ + "! head connlu/pdbc-cont-test.conllu" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "34aa16d9", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n", + "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n", + "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n", + "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n", + "4\tw\tw\t_\t_\t_\t3\tcomp\t3:adjunct_adl\t_\r\n", + "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n", + "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n", + "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n", + "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n", + "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n" + ] + } + ], + "source": [ + "! 
head connlu/pdbc-cont-test-pred.conllu" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "combo_python39", + "language": "python", + "name": "combo_python39" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/COMBO/TrainContModel.ipynb a/COMBO/TrainContModel.ipynb new file mode 100644 index 0000000..8c58186 --- /dev/null +++ a/COMBO/TrainContModel.ipynb @@ -0,0 +1,14293 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "e613a4cf", + "metadata": {}, + "outputs": [], + "source": [ + "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "e2563423", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0406 22:49:10.502099 139680283460672 params.py:248] include_in_archive = None\n", + "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - random_seed = 8787\n", + "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - numpy_seed = 8787\n", + "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - pytorch_seed = 8787\n", + "2023-04-06 22:49:10,504 - INFO - allennlp.common.checks - Pytorch version: 1.13.1\n", + "2023-04-06 22:49:10,505 - INFO - allennlp.common.params - type = default\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.type = conllu\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.lazy = False\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.cache_directory = None\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.max_instances = None\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - 
dataset_reader.manual_distributed_sharding = False\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.manual_multi_process_sharding = False\n", + "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.type = characters_const_padding\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.namespace = token_characters\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.start_tokens = None\n", + "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.end_tokens = None\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.min_padding_length = 32\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.type = feats_indexer\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.namespace = feats\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.feature_name = feats_\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.token_min_padding_length = 
0\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.start_tokens = None\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.end_tokens = None\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.namespace = tags\n", + "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.max_length = 
None\n", + "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.type = single_id\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.namespace = upostag\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.start_tokens = None\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.end_tokens = None\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.type = single_id\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.end_tokens = None\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - 
dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.start_tokens = None\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.end_tokens = None\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.features = ['token', 'char']\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.targets = ['head', 'deprel']\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.use_sem = False\n", + "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - train_data_path = 
connlu/pdbc-cont-train.conllu\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - datasets_for_vocab_creation = ['train']\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_dataset_reader = None\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_data_path = connlu/pdbc-cont-validation.conllu\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_data_loader = None\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - test_data_path = None\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - evaluate_on_test = False\n", + "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - batch_weight_key = \n", + "2023-04-06 22:49:13,448 - INFO - allennlp.training.util - Reading training data from connlu/pdbc-cont-train.conllu\n", + "reading instances: 0it [00:00, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "reading instances: 3878it [00:02, 1938.62it/s]\n", + "reading instances: 8280it [00:04, 2010.38it/s]\n", + "reading instances: 11587it [00:06, 1750.85it/s]\n", + "reading instances: 15202it [00:08, 1679.50it/s]\n", + "reading instances: 15903it [00:09, 1757.51it/s]\n", + "2023-04-06 22:49:22,498 - INFO - allennlp.training.util - Reading validation data from connlu/pdbc-cont-validation.conllu\n", + "reading instances: 0it [00:00, ?it/s]\n", + "reading instances: 1980it [00:00, 3415.26it/s]\n", + "2023-04-06 22:49:23,078 - INFO - allennlp.commands.train - From dataset instances, train will be considered for vocabulary creation.\n", + "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.type = from_instances_extended\n", + "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.min_count = None\n", + "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.max_vocab_size = None\n", + "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.non_padded_namespaces = 
['head_labels']\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.pretrained_files = None\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.only_include_pretrained_words = True\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.min_pretrained_embeddings = None\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.padding_token = __PAD__\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.oov_token = _\n", + "2023-04-06 22:49:23,079 - INFO - allennlp.data.vocabulary - Fitting token dictionary from dataset.\n", + "building vocab: 0it [00:00, ?it/s]\n", + "building vocab: 15903it [00:01, 10066.76it/s]\n", + "2023-04-06 22:49:24,659 - INFO - allennlp.common.params - model.type = semantic_multitask\n", + "2023-04-06 22:49:24,660 - INFO - allennlp.common.params - model.text_field_embedder.type = basic\n", + "2023-04-06 22:49:24,660 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "2023-04-06 
22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - type = relu\n", + "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - type = relu\n", + "2023-04-06 22:49:24,662 - INFO - allennlp.common.params - type = linear\n", + "2023-04-06 22:49:24,666 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f090c144280>\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.last_layer_only = True\n", + "2023-04-06 22:49:24,668 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "2023-04-06 22:49:24,668 - INFO - allennlp.common.params - 
model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.type = combo_encoder\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.input_size = 164\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "2023-04-06 22:49:33,578 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.use_highway = False\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.seq_encoder.layer_dropout_probability = 0.33\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.use_sample_weight = True\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.lemmatizer = None\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.upos_tagger = None\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.xpos_tagger = None\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.semantic_relation = None\n", + "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.morphological_feat = None\n", + "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.type = combo_dependency_parsing_from_vocab\n", + "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.vocab_namespace = deprel_labels\n", + "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + 
"2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "2023-04-06 22:49:34,207 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "2023-04-06 22:49:34,212 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.out_features = 128\n", + "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.activation = tanh\n", + "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - 
model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.enhanced_dependency_relation = None\n", + "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.type = l2\n", + "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.alpha = 1e-06\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.type = l2\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.alpha = 1e-06\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.type = l2\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.alpha = 1e-06\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.type = l2\n", + "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.alpha = 1e-05\n", + "2023-04-06 22:49:34,219 - INFO - filelock - Lock 139674732932928 acquired on ./allennlp867qpopk/vocabulary/.lock\n", + "2023-04-06 22:49:34,220 - INFO - filelock - Lock 139674732932928 released on ./allennlp867qpopk/vocabulary/.lock\n", + "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n", + "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.batch_size = 1\n", + "2023-04-06 22:49:34,220 - INFO 
- allennlp.common.params - data_loader.shuffle = False\n", + "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.sampler = None\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.num_workers = 0\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.pin_memory = False\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.drop_last = False\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.timeout = 0\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n", + "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "/home/kkrasnowska/anaconda3/envs/combo_p39/lib/python3.8/site-packages/combo/data/samplers/samplers.py:51: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. 
If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", + " self.batch_dataset = np.array(self.batch_dataset)[indices].tolist()\n", + "2023-04-06 22:49:34,240 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.batch_size = 1\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.shuffle = False\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.sampler = None\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.num_workers = 0\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.pin_memory = False\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.drop_last = False\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.timeout = 0\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n", + "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n", + "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n", + "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n", + "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n", + "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.type = gradient_descent_validate_n\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.patience = 1\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.validation_metric = +EM\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.num_epochs = 400\n", + "2023-04-06 22:49:34,245 - INFO - 
allennlp.common.params - trainer.cuda_device = 0\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.grad_norm = None\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.grad_clipping = 5\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.distributed = None\n", + "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.world_size = 1\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.num_gradient_accumulation_steps = 1\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.use_amp = False\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.no_grad = None\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.momentum_scheduler = None\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.tensorboard_writer = None\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.moving_average = None\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.batch_callbacks = None\n", + "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.epoch_callbacks.0.type = transfer_patience\n", + "2023-04-06 22:49:34,247 - INFO - allennlp.common.params - trainer.end_callbacks = None\n", + "2023-04-06 22:49:34,247 - INFO - allennlp.common.params - trainer.trainer_callbacks = None\n", + "2023-04-06 22:49:36,168 - INFO - allennlp.common.params - trainer.optimizer.type = adam\n", + "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.parameter_groups = None\n", + "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.lr = 0.002\n", + "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.betas = [0.9, 0.9]\n", + "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.eps = 1e-08\n", + "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.weight_decay = 0.0\n", + 
"2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.amsgrad = False\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.training.optimizers - Number of trainable parameters: 11053808\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - The following parameters are Frozen (without gradient):\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.word_embeddings.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.position_embeddings.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.token_type_embeddings.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.bias\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.bias\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.weight\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.bias\n", + "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,171 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.bias\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.weight\n", + "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.bias\n", + "2023-04-06 
22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.weight\n", + "2023-04-06 22:49:36,172 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.bias\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.weight\n", + "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,173 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.weight\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.bias\n", + "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.weight\n", + 
"2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.bias\n", + "2023-04-06 
22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.bias\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.weight\n", + 
"2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.weight\n", + "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.weight\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.bias\n", + "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util 
- text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.bias\n", + "2023-04-06 22:49:36,177 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.weight\n", + "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.weight\n", + "2023-04-06 22:49:36,178 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.bias\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.bias\n", + "2023-04-06 22:49:36,179 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.weight\n", + "2023-04-06 
22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.bias\n", + 
"2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.weight\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.bias\n", + "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.weight\n", + "2023-04-06 22:49:36,181 - INFO 
- allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.bias\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.weight\n", + "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.bias\n", + "2023-04-06 22:49:36,182 
- INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.weight\n", + "2023-04-06 
22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.bias\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.weight\n", + "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.weight\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.bias\n", + "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.bias\n", + "2023-04-06 22:49:36,184 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.weight\n", + "2023-04-06 22:49:36,184 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.weight\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.bias\n", + "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.bias\n", + 
"2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.bias\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.weight\n", + "2023-04-06 22:49:36,186 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.bias\n", + "2023-04-06 
22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.weight\n", + "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.weight\n", + "2023-04-06 22:49:36,188 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.bias\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.weight\n", + "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.bias\n", + "2023-04-06 
22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.weight\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.bias\n", + "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.weight\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.bias\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.weight\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.bias\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.weight\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.bias\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.weight\n", + "2023-04-06 22:49:36,190 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.bias\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.weight\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.bias\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.weight\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.bias\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.weight\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.bias\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.weight\r\n", + "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.bias\r\n", + "2023-04-06 22:49:36,191 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.weight\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.bias\r\n", + "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.bias\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.weight\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.bias\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - The following parameters are Tunable (with gradient):\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - _head_sentinel\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.char_embed.weight\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.weight\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.bias\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.weight\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.bias\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.weight\r\n", + "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - 
dependency_relation.head_predictor.head_projection_layer.weight\r\n", + "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.bias\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.weight\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.bias\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.weight\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.bias\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.weight\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.bias\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.weight\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.bias\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.type = combo_scheduler\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.patience = 6\r\n", + "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.decreases = 2\r\n", + "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.threshold = 0.001\r\n", + "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.type = finishing_only_checkpointer\r\n", + "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.keep_serialized_model_every_num_seconds = None\r\n", + "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.num_serialized_models_to_keep = 
2\r\n", + "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.model_save_interval = None\r\n", + "2023-04-06 22:49:36,199 - INFO - combo.training.trainer - Beginning training.\r\n", + "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - Epoch 0/399\r\n", + "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.3G\r\n", + "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - GPU 0 memory usage: 1.4G\r\n", + "2023-04-06 22:49:36,206 - INFO - allennlp.training.trainer - Training\r\n", + " 0%| | 0/95 [00:00<?, ?it/s]\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0004, UAS: 0.0545, LAS: 0.0004, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.5812, partial_loss/deprel_loss: 12.1384, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5281, loss: 11.5281, batch_reg_loss: 0.1011, reg_loss: 0.1011 ||: 1%|1 | 1/95 [00:02<03:22, 2.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0534, LAS: 0.0025, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 54.5014, partial_loss/deprel_loss: 9.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 18.4440, loss: 29.0149, batch_reg_loss: 0.1003, reg_loss: 0.1007 ||: 5%|5 | 5/95 [00:04<02:32, 1.69s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0048, UAS: 0.0484, LAS: 0.0043, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 26.8907, partial_loss/deprel_loss: 10.2825, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7041, loss: 28.1204, batch_reg_loss: 0.1000, reg_loss: 0.1004 ||: 9%|9 | 9/95 [00:06<01:56, 1.35s/it]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0075, UAS: 0.0514, LAS: 0.0053, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 16.4258, partial_loss/deprel_loss: 8.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5639, loss: 24.1295, batch_reg_loss: 0.0996, reg_loss: 0.1003 ||: 13%|#2 | 12/95 [00:08<01:35, 1.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0248, UAS: 0.0550, LAS: 0.0072, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 30.6838, partial_loss/deprel_loss: 6.7519, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6376, loss: 21.7925, batch_reg_loss: 0.0993, reg_loss: 0.1001 ||: 16%|#5 | 15/95 [00:10<01:20, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0128, UAS: 0.0582, LAS: 0.0085, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.5911, partial_loss/deprel_loss: 8.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 9.3455, loss: 19.5927, batch_reg_loss: 0.0988, reg_loss: 0.0999 ||: 20%|## | 19/95 [00:13<01:08, 1.11it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0032, UAS: 0.0579, LAS: 0.0088, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 18.6420, partial_loss/deprel_loss: 11.9442, partial_loss/cycle_loss: 0.0000, batch_loss: 13.3822, loss: 18.3815, batch_reg_loss: 0.0984, reg_loss: 0.0997 ||: 23%|##3 | 22/95 [00:15<01:01, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0279, UAS: 0.0718, LAS: 0.0148, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 11.8369, partial_loss/deprel_loss: 6.2066, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4307, loss: 17.0702, batch_reg_loss: 0.0980, reg_loss: 0.0995 ||: 26%|##6 | 25/95 [00:18<00:59, 1.17it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0260, UAS: 0.0776, LAS: 0.0161, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1379, partial_loss/deprel_loss: 6.0939, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4003, loss: 16.0644, batch_reg_loss: 0.0976, reg_loss: 0.0993 ||: 29%|##9 | 28/95 [00:22<01:07, 1.01s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0340, UAS: 0.0781, LAS: 0.0163, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.3717, partial_loss/deprel_loss: 6.7100, partial_loss/cycle_loss: 0.0000, batch_loss: 7.1393, loss: 15.1670, batch_reg_loss: 0.0969, reg_loss: 0.0990 ||: 34%|###3 | 32/95 [00:24<00:56, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0187, UAS: 0.0777, LAS: 0.0165, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.8800, partial_loss/deprel_loss: 8.6119, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1620, loss: 14.6762, batch_reg_loss: 0.0964, reg_loss: 0.0988 ||: 37%|###6 | 35/95 [00:27<00:51, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0104, UAS: 0.0764, LAS: 0.0161, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 13.7758, partial_loss/deprel_loss: 10.7456, partial_loss/cycle_loss: 0.0000, batch_loss: 11.4476, loss: 14.4105, batch_reg_loss: 0.0959, reg_loss: 0.0986 ||: 40%|#### | 38/95 [00:29<00:46, 1.24it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0211, UAS: 0.0791, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5813, partial_loss/deprel_loss: 7.7125, partial_loss/cycle_loss: 0.0000, batch_loss: 7.7814, loss: 13.8527, batch_reg_loss: 0.0952, reg_loss: 0.0983 ||: 44%|####4 | 42/95 [00:31<00:40, 1.31it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0355, UAS: 0.0847, LAS: 0.0172, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5881, partial_loss/deprel_loss: 5.1220, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1099, loss: 13.3031, batch_reg_loss: 0.0947, reg_loss: 0.0981 ||: 47%|####7 | 45/95 [00:34<00:39, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0147, UAS: 0.0887, LAS: 0.0176, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7138, partial_loss/deprel_loss: 9.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 9.6557, loss: 12.9664, batch_reg_loss: 0.0941, reg_loss: 0.0978 ||: 51%|##### | 48/95 [00:36<00:35, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0279, UAS: 0.0896, LAS: 0.0176, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1660, partial_loss/deprel_loss: 7.7062, partial_loss/cycle_loss: 0.0000, batch_loss: 7.6917, loss: 12.7503, batch_reg_loss: 0.0935, reg_loss: 0.0976 ||: 54%|#####3 | 51/95 [00:38<00:32, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0475, UAS: 0.0943, LAS: 0.0184, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 4.6122, partial_loss/deprel_loss: 5.5939, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4905, loss: 12.4588, batch_reg_loss: 0.0929, reg_loss: 0.0974 ||: 57%|#####6 | 54/95 [00:40<00:30, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0095, UAS: 0.0959, LAS: 0.0184, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1111, partial_loss/deprel_loss: 9.9458, partial_loss/cycle_loss: 0.0000, batch_loss: 10.0712, loss: 12.2757, batch_reg_loss: 0.0923, reg_loss: 0.0971 ||: 60%|###### | 57/95 [00:43<00:29, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0295, UAS: 0.1010, LAS: 0.0194, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.3592, partial_loss/deprel_loss: 8.1111, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0525, loss: 12.0223, batch_reg_loss: 0.0918, reg_loss: 0.0968 ||: 63%|######3 | 60/95 [00:45<00:27, 1.29it/s] \n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0211, UAS: 0.1046, LAS: 0.0201, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.1219, partial_loss/deprel_loss: 10.9192, partial_loss/cycle_loss: 0.0000, batch_loss: 11.2509, loss: 11.8418, batch_reg_loss: 0.0912, reg_loss: 0.0966 ||: 66%|######6 | 63/95 [00:48<00:24, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0635, UAS: 0.1096, LAS: 0.0216, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5291, partial_loss/deprel_loss: 5.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5181, loss: 11.5928, 
batch_reg_loss: 0.0906, reg_loss: 0.0963 ||: 69%|######9 | 66/95 [00:50<00:22, 1.32it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0398, UAS: 0.1150, LAS: 0.0234, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7731, partial_loss/deprel_loss: 9.1982, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4030, loss: 11.3990, batch_reg_loss: 0.0898, reg_loss: 0.0960 ||: 74%|#######3 | 70/95 [00:52<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0846, UAS: 0.1186, LAS: 0.0248, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.3256, partial_loss/deprel_loss: 6.6774, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6964, loss: 11.2984, batch_reg_loss: 0.0893, reg_loss: 0.0957 ||: 77%|#######6 | 73/95 [00:55<00:16, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0833, UAS: 0.1243, LAS: 0.0270, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0066, partial_loss/deprel_loss: 6.5017, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4915, loss: 11.1237, batch_reg_loss: 0.0888, reg_loss: 0.0954 ||: 80%|######## | 76/95 [00:57<00:15, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0703, UAS: 0.1299, LAS: 0.0293, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.8032, partial_loss/deprel_loss: 7.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2538, loss: 10.9525, batch_reg_loss: 0.0882, reg_loss: 0.0951 ||: 84%|########4 | 80/95 [01:00<00:11, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1558, UAS: 0.1366, 
LAS: 0.0323, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8053, partial_loss/deprel_loss: 4.8429, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7231, loss: 10.7869, batch_reg_loss: 0.0878, reg_loss: 0.0948 ||: 87%|########7 | 83/95 [01:02<00:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0715, UAS: 0.1407, LAS: 0.0338, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.0259, partial_loss/deprel_loss: 7.7293, partial_loss/cycle_loss: 0.0000, batch_loss: 7.6759, loss: 10.6741, batch_reg_loss: 0.0873, reg_loss: 0.0946 ||: 91%|######### | 86/95 [01:05<00:06, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2157, UAS: 0.1479, LAS: 0.0369, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3231, partial_loss/deprel_loss: 3.5750, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4113, loss: 10.5203, batch_reg_loss: 0.0867, reg_loss: 0.0942 ||: 95%|#########4| 90/95 [01:07<00:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1474, UAS: 0.1547, LAS: 0.0400, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0826, partial_loss/deprel_loss: 5.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2025, loss: 10.3609, batch_reg_loss: 0.0862, reg_loss: 0.0939 ||: 99%|#########8| 94/95 [01:10<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0841, UAS: 0.1557, LAS: 0.0404, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5016, partial_loss/deprel_loss: 7.9801, partial_loss/cycle_loss: 0.0000, batch_loss: 7.9705, 
loss: 10.3357, batch_reg_loss: 0.0860, reg_loss: 0.0938 ||: 100%|##########| 95/95 [01:11<00:00, 1.33it/s]\n", + "2023-04-06 22:50:47,786 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0548, UAS: 0.2285, LAS: 0.0729, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1434, partial_loss/deprel_loss: 20.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5534, loss: 17.4393, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:12, 1.35s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2127, UAS: 0.3238, LAS: 0.1315, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1571, partial_loss/deprel_loss: 10.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4327, loss: 13.8287, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:04<00:08, 1.25s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1265, UAS: 0.3078, LAS: 0.1205, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1798, partial_loss/deprel_loss: 12.8523, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5178, loss: 14.0520, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:06<00:05, 1.20s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2520, UAS: 0.3285, LAS: 0.1346, UEM: 0.0024, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5845, partial_loss/deprel_loss: 9.4003, partial_loss/cycle_loss: 0.0000, batch_loss: 8.2371, loss: 13.1916, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:09<00:03, 1.18s/it] \n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1437, UAS: 0.3256, LAS: 0.1316, UEM: 0.0020, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5130, partial_loss/deprel_loss: 13.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6074, loss: 13.1748, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:11<00:01, 1.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3640, UAS: 0.3546, LAS: 0.1527, UEM: 0.0525, LEM: 0.0098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4938, partial_loss/deprel_loss: 6.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8929, loss: 12.5128, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:13<00:00, 1.27s/it] \n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - reg_loss | 0.094 | 0.000\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - UEM | 0.000 | 0.052\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - LEM | 0.000 | 0.010\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EM | 0.084 | 0.364\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 7.502 | 2.494\n", + "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 
0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - UAS | 0.156 | 0.355\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6412.477 | N/A\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 7.980 | 6.743\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - loss | 10.336 | 12.513\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - LAS | 0.040 | 0.153\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 1397.910 | N/A\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:01,761 - INFO - combo.training.trainer - Epoch duration: 0:01:25.561854\n", + "2023-04-06 22:51:01,761 - INFO - combo.training.trainer - Estimated training time remaining: 9:28:59\n", + "2023-04-06 22:51:01,761 - INFO - allennlp.training.trainer - Epoch 1/399\n", + "2023-04-06 22:51:01,762 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:51:01,762 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:51:01,769 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.0892, UAS: 0.3088, LAS: 0.1046, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.4360, partial_loss/deprel_loss: 7.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3119, loss: 7.2408, batch_reg_loss: 0.0855, reg_loss: 0.0857 ||: 4%|4 | 4/95 [00:02<00:53, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1269, UAS: 0.3102, LAS: 0.1127, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.4805, partial_loss/deprel_loss: 6.2504, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1813, loss: 7.0525, batch_reg_loss: 0.0849, reg_loss: 0.0854 ||: 8%|8 | 8/95 [00:04<00:50, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3090, UAS: 0.3354, LAS: 0.1310, UEM: 0.0049, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2528, partial_loss/deprel_loss: 3.8317, partial_loss/cycle_loss: 0.0000, batch_loss: 3.6003, loss: 6.8078, batch_reg_loss: 0.0844, reg_loss: 0.0851 ||: 13%|#2 | 12/95 [00:07<00:49, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1101, UAS: 0.3157, LAS: 0.1218, UEM: 0.0043, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.7482, partial_loss/deprel_loss: 7.9708, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0102, loss: 7.3046, batch_reg_loss: 0.0839, reg_loss: 0.0849 ||: 17%|#6 | 16/95 [00:09<00:47, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2304, UAS: 0.3321, LAS: 0.1318, UEM: 0.0033, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3571, partial_loss/deprel_loss: 4.9808, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7394, loss: 7.0827, 
batch_reg_loss: 0.0834, reg_loss: 0.0846 ||: 21%|##1 | 20/95 [00:12<00:46, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2079, UAS: 0.3461, LAS: 0.1419, UEM: 0.0027, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4135, partial_loss/deprel_loss: 4.8411, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6384, loss: 6.8631, batch_reg_loss: 0.0828, reg_loss: 0.0844 ||: 25%|##5 | 24/95 [00:14<00:44, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1619, UAS: 0.3568, LAS: 0.1503, UEM: 0.0023, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0594, partial_loss/deprel_loss: 7.0292, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9176, loss: 6.7511, batch_reg_loss: 0.0823, reg_loss: 0.0841 ||: 29%|##9 | 28/95 [00:17<00:41, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3035, UAS: 0.3679, LAS: 0.1575, UEM: 0.0038, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5356, partial_loss/deprel_loss: 4.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8104, loss: 6.6715, batch_reg_loss: 0.0818, reg_loss: 0.0838 ||: 34%|###3 | 32/95 [00:19<00:37, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3353, UAS: 0.3790, LAS: 0.1674, UEM: 0.0040, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5441, partial_loss/deprel_loss: 4.1055, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8744, loss: 6.6041, batch_reg_loss: 0.0812, reg_loss: 0.0835 ||: 39%|###8 | 37/95 [00:22<00:33, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3046, UAS: 0.3860, LAS: 0.1749, UEM: 0.0036, LEM: 
0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0900, partial_loss/deprel_loss: 4.5535, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3415, loss: 6.5507, batch_reg_loss: 0.0807, reg_loss: 0.0832 ||: 43%|####3 | 41/95 [00:24<00:31, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2472, UAS: 0.3908, LAS: 0.1796, UEM: 0.0034, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3257, partial_loss/deprel_loss: 5.5917, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4187, loss: 6.5291, batch_reg_loss: 0.0802, reg_loss: 0.0830 ||: 47%|####7 | 45/95 [00:26<00:29, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3365, UAS: 0.4054, LAS: 0.1916, UEM: 0.0070, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9531, partial_loss/deprel_loss: 4.3089, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1175, loss: 6.3710, batch_reg_loss: 0.0797, reg_loss: 0.0827 ||: 52%|#####1 | 49/95 [00:29<00:26, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2627, UAS: 0.4168, LAS: 0.2021, UEM: 0.0088, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9681, partial_loss/deprel_loss: 5.8151, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7249, loss: 6.2517, batch_reg_loss: 0.0792, reg_loss: 0.0825 ||: 56%|#####5 | 53/95 [00:31<00:25, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3356, UAS: 0.4249, LAS: 0.2092, UEM: 0.0083, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5951, partial_loss/deprel_loss: 4.9067, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7231, loss: 6.1661, batch_reg_loss: 0.0787, reg_loss: 
0.0822 ||: 60%|###### | 57/95 [00:34<00:24, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3085, UAS: 0.4378, LAS: 0.2220, UEM: 0.0282, LEM: 0.0019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5148, partial_loss/deprel_loss: 5.2129, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1516, loss: 6.0099, batch_reg_loss: 0.0783, reg_loss: 0.0820 ||: 64%|######4 | 61/95 [00:37<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2475, UAS: 0.4450, LAS: 0.2287, UEM: 0.0392, LEM: 0.0028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.9321, partial_loss/deprel_loss: 6.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4955, loss: 5.9507, batch_reg_loss: 0.0779, reg_loss: 0.0818 ||: 67%|######7 | 64/95 [00:39<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3958, UAS: 0.4495, LAS: 0.2332, UEM: 0.0377, LEM: 0.0027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1590, partial_loss/deprel_loss: 4.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1724, loss: 5.9121, batch_reg_loss: 0.0776, reg_loss: 0.0816 ||: 71%|####### | 67/95 [00:41<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2506, UAS: 0.4516, LAS: 0.2357, UEM: 0.0367, LEM: 0.0026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.5986, partial_loss/deprel_loss: 6.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5810, loss: 5.9082, batch_reg_loss: 0.0773, reg_loss: 0.0814 ||: 74%|#######3 | 70/95 [00:43<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2938, UAS: 0.4553, LAS: 0.2401, UEM: 0.0377, LEM: 0.0027, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.9417, partial_loss/deprel_loss: 6.1287, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1683, loss: 5.8802, batch_reg_loss: 0.0770, reg_loss: 0.0813 ||: 77%|#######6 | 73/95 [00:46<00:15, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3746, UAS: 0.4615, LAS: 0.2468, UEM: 0.0361, LEM: 0.0025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0424, partial_loss/deprel_loss: 4.8777, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7872, loss: 5.8175, batch_reg_loss: 0.0765, reg_loss: 0.0810 ||: 81%|########1 | 77/95 [00:48<00:12, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6636, UAS: 0.4715, LAS: 0.2577, UEM: 0.0619, LEM: 0.0139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5887, partial_loss/deprel_loss: 1.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2757, loss: 5.7031, batch_reg_loss: 0.0762, reg_loss: 0.0808 ||: 84%|########4 | 80/95 [00:51<00:11, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4942, UAS: 0.4770, LAS: 0.2646, UEM: 0.0600, LEM: 0.0134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5109, partial_loss/deprel_loss: 3.5031, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3806, loss: 5.6570, batch_reg_loss: 0.0759, reg_loss: 0.0806 ||: 88%|########8 | 84/95 [00:54<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3159, UAS: 0.4840, LAS: 0.2728, UEM: 0.0585, LEM: 0.0128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1182, partial_loss/deprel_loss: 5.8656, partial_loss/cycle_loss: 0.0000, 
batch_loss: 5.9916, loss: 5.5923, batch_reg_loss: 0.0755, reg_loss: 0.0804 ||: 93%|#########2| 88/95 [00:56<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4646, UAS: 0.4886, LAS: 0.2786, UEM: 0.0570, LEM: 0.0125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0568, partial_loss/deprel_loss: 3.9986, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8854, loss: 5.5646, batch_reg_loss: 0.0752, reg_loss: 0.0802 ||: 97%|#########6| 92/95 [00:58<00:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6402, UAS: 0.4963, LAS: 0.2871, UEM: 0.0600, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1759, partial_loss/deprel_loss: 2.2577, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1162, loss: 5.4829, batch_reg_loss: 0.0749, reg_loss: 0.0800 ||: 100%|##########| 95/95 [01:00<00:00, 1.56it/s]\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - reg_loss | 0.080 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - UEM | 0.060 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - LEM | 0.013 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EM | 0.640 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.176 | N/A\n", + "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", 
+ "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - UAS | 0.496 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 2.258 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - loss | 5.483 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - LAS | 0.287 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.722 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:02,567 - INFO - combo.training.trainer - Epoch duration: 0:01:00.805524\n", + "2023-04-06 22:52:02,567 - INFO - combo.training.trainer - Estimated training time remaining: 8:05:27\n", + "2023-04-06 22:52:02,567 - INFO - allennlp.training.trainer - Epoch 2/399\n", + "2023-04-06 22:52:02,567 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:52:02,568 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:52:02,574 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.5070, UAS: 0.6220, LAS: 0.4480, UEM: 0.0040, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7143, partial_loss/deprel_loss: 3.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4460, loss: 4.2797, batch_reg_loss: 0.0746, reg_loss: 0.0747 ||: 4%|4 | 4/95 [00:02<00:57, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5354, UAS: 0.6512, LAS: 0.4740, UEM: 0.0028, LEM: 0.0009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6557, partial_loss/deprel_loss: 3.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3891, loss: 3.9798, batch_reg_loss: 0.0743, reg_loss: 0.0745 ||: 8%|8 | 8/95 [00:05<00:54, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5451, UAS: 0.6686, LAS: 0.4905, UEM: 0.0285, LEM: 0.0017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3370, partial_loss/deprel_loss: 3.2024, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1032, loss: 3.8055, batch_reg_loss: 0.0739, reg_loss: 0.0744 ||: 13%|#2 | 12/95 [00:07<00:53, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3732, UAS: 0.6592, LAS: 0.4869, UEM: 0.0549, LEM: 0.0066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0546, partial_loss/deprel_loss: 5.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5687, loss: 3.9035, batch_reg_loss: 0.0737, reg_loss: 0.0743 ||: 16%|#5 | 15/95 [00:09<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5262, UAS: 0.6727, LAS: 0.4998, UEM: 0.0628, LEM: 0.0070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6727, partial_loss/deprel_loss: 3.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3465, loss: 
3.7405, batch_reg_loss: 0.0735, reg_loss: 0.0741 ||: 19%|#8 | 18/95 [00:12<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6196, UAS: 0.6788, LAS: 0.5066, UEM: 0.0849, LEM: 0.0087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5574, partial_loss/deprel_loss: 2.5821, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4504, loss: 3.6848, batch_reg_loss: 0.0733, reg_loss: 0.0740 ||: 22%|##2 | 21/95 [00:14<00:52, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4468, UAS: 0.6777, LAS: 0.5063, UEM: 0.0764, LEM: 0.0079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3180, partial_loss/deprel_loss: 4.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5005, loss: 3.6993, batch_reg_loss: 0.0731, reg_loss: 0.0739 ||: 25%|##5 | 24/95 [00:16<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6454, UAS: 0.6869, LAS: 0.5163, UEM: 0.0824, LEM: 0.0090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3747, partial_loss/deprel_loss: 2.2014, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1089, loss: 3.5795, batch_reg_loss: 0.0729, reg_loss: 0.0738 ||: 28%|##8 | 27/95 [00:18<00:48, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6744, UAS: 0.6970, LAS: 0.5267, UEM: 0.2029, LEM: 0.0663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8321, partial_loss/deprel_loss: 1.8400, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7111, loss: 3.4778, batch_reg_loss: 0.0727, reg_loss: 0.0737 ||: 32%|###1 | 30/95 [00:21<00:50, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.4503, UAS: 0.6922, LAS: 0.5225, UEM: 0.1897, LEM: 0.0620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.6911, partial_loss/deprel_loss: 4.8424, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8846, loss: 3.5555, batch_reg_loss: 0.0724, reg_loss: 0.0736 ||: 36%|###5 | 34/95 [00:24<00:44, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6986, UAS: 0.7002, LAS: 0.5305, UEM: 0.2109, LEM: 0.0621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6816, partial_loss/deprel_loss: 1.6548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5324, loss: 3.4693, batch_reg_loss: 0.0723, reg_loss: 0.0735 ||: 39%|###8 | 37/95 [00:26<00:44, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5281, UAS: 0.7007, LAS: 0.5313, UEM: 0.1987, LEM: 0.0581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2648, partial_loss/deprel_loss: 3.6513, partial_loss/cycle_loss: 0.0000, batch_loss: 3.6460, loss: 3.4727, batch_reg_loss: 0.0720, reg_loss: 0.0733 ||: 43%|####3 | 41/95 [00:29<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4741, UAS: 0.6962, LAS: 0.5273, UEM: 0.1924, LEM: 0.0563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4164, partial_loss/deprel_loss: 4.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4855, loss: 3.5359, batch_reg_loss: 0.0718, reg_loss: 0.0732 ||: 46%|####6 | 44/95 [00:31<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5552, UAS: 0.6990, LAS: 0.5305, UEM: 0.1911, LEM: 0.0544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7836, partial_loss/deprel_loss: 3.3469, partial_loss/cycle_loss: 
0.0000, batch_loss: 3.3059, loss: 3.5092, batch_reg_loss: 0.0717, reg_loss: 0.0731 ||: 49%|####9 | 47/95 [00:33<00:35, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7089, UAS: 0.7034, LAS: 0.5355, UEM: 0.1959, LEM: 0.0544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 1.7523, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6374, loss: 3.4603, batch_reg_loss: 0.0715, reg_loss: 0.0730 ||: 53%|#####2 | 50/95 [00:35<00:34, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5674, UAS: 0.7029, LAS: 0.5355, UEM: 0.1889, LEM: 0.0524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8019, partial_loss/deprel_loss: 3.3643, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3231, loss: 3.4721, batch_reg_loss: 0.0713, reg_loss: 0.0729 ||: 56%|#####5 | 53/95 [00:37<00:30, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4533, UAS: 0.7061, LAS: 0.5395, UEM: 0.1821, LEM: 0.0493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9593, partial_loss/deprel_loss: 4.6140, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7542, loss: 3.4339, batch_reg_loss: 0.0711, reg_loss: 0.0728 ||: 60%|###### | 57/95 [00:40<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6635, UAS: 0.7108, LAS: 0.5443, UEM: 0.1847, LEM: 0.0478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3704, partial_loss/deprel_loss: 2.2964, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1821, loss: 3.3868, batch_reg_loss: 0.0709, reg_loss: 0.0727 ||: 64%|######4 | 61/95 [00:42<00:22, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.5675, UAS: 0.7133, LAS: 0.5472, UEM: 0.1795, LEM: 0.0456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8984, partial_loss/deprel_loss: 3.5634, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5010, loss: 3.3671, batch_reg_loss: 0.0707, reg_loss: 0.0726 ||: 68%|######8 | 65/95 [00:45<00:20, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6256, UAS: 0.7172, LAS: 0.5516, UEM: 0.1924, LEM: 0.0494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9098, partial_loss/deprel_loss: 2.6757, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5930, loss: 3.3262, batch_reg_loss: 0.0705, reg_loss: 0.0725 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6834, UAS: 0.7184, LAS: 0.5535, UEM: 0.1973, LEM: 0.0488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1975, partial_loss/deprel_loss: 2.0961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9867, loss: 3.3143, batch_reg_loss: 0.0704, reg_loss: 0.0724 ||: 75%|#######4 | 71/95 [00:49<00:17, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5457, UAS: 0.7191, LAS: 0.5544, UEM: 0.1902, LEM: 0.0470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2685, partial_loss/deprel_loss: 3.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7424, loss: 3.3121, batch_reg_loss: 0.0702, reg_loss: 0.0723 ||: 79%|#######8 | 75/95 [00:52<00:13, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4441, UAS: 0.7213, LAS: 0.5570, UEM: 0.1863, LEM: 0.0451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3762, partial_loss/deprel_loss: 4.7015, partial_loss/cycle_loss: 0.0000, 
batch_loss: 4.9064, loss: 3.2949, batch_reg_loss: 0.0700, reg_loss: 0.0722 ||: 83%|########3 | 79/95 [00:54<00:10, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7161, UAS: 0.7224, LAS: 0.5588, UEM: 0.1833, LEM: 0.0441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0918, partial_loss/deprel_loss: 1.9270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8298, loss: 3.2891, batch_reg_loss: 0.0698, reg_loss: 0.0721 ||: 87%|########7 | 83/95 [00:57<00:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5738, UAS: 0.7242, LAS: 0.5609, UEM: 0.1823, LEM: 0.0430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8083, partial_loss/deprel_loss: 3.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3436, loss: 3.2741, batch_reg_loss: 0.0696, reg_loss: 0.0720 ||: 92%|#########1| 87/95 [01:00<00:05, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6708, UAS: 0.7295, LAS: 0.5668, UEM: 0.2018, LEM: 0.0497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4738, partial_loss/deprel_loss: 2.0978, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0424, loss: 3.2064, batch_reg_loss: 0.0694, reg_loss: 0.0718 ||: 96%|#########5| 91/95 [01:03<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7269, UAS: 0.7333, LAS: 0.5708, UEM: 0.2004, LEM: 0.0483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9830, partial_loss/deprel_loss: 1.8156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7183, loss: 3.1682, batch_reg_loss: 0.0692, reg_loss: 0.0717 ||: 100%|##########| 95/95 [01:05<00:00, 1.53it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7269, UAS: 0.7333, LAS: 0.5708, UEM: 0.2004, LEM: 0.0483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9830, partial_loss/deprel_loss: 1.8156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7183, loss: 3.1682, batch_reg_loss: 0.0692, reg_loss: 0.0717 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-06 22:53:08,051 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - reg_loss | 0.072 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UEM | 0.200 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - LEM | 0.048 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EM | 0.727 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.983 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UAS | 0.733 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.816 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - loss | 3.168 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - 
combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - LAS | 0.571 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.722 | N/A\n", + "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.trainer - Epoch duration: 0:01:05.486109\n", + "2023-04-06 22:53:08,053 - INFO - combo.training.trainer - Estimated training time remaining: 7:47:15\n", + "2023-04-06 22:53:08,053 - INFO - allennlp.training.trainer - Epoch 3/399\n", + "2023-04-06 22:53:08,054 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:53:08,054 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:53:08,060 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6676, UAS: 0.8632, LAS: 0.7232, UEM: 0.4714, LEM: 0.1227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6770, partial_loss/deprel_loss: 2.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2223, loss: 1.6806, batch_reg_loss: 0.0691, reg_loss: 0.0691 ||: 3%|3 | 3/95 [00:02<01:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6184, UAS: 0.8099, LAS: 0.6626, UEM: 0.3402, LEM: 0.0788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 2.0338, partial_loss/deprel_loss: 2.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7803, loss: 2.3373, batch_reg_loss: 0.0689, reg_loss: 0.0690 ||: 7%|7 | 7/95 [00:04<01:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7145, UAS: 0.7989, LAS: 0.6512, UEM: 0.2798, LEM: 0.0575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0975, partial_loss/deprel_loss: 1.9117, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8176, loss: 2.4843, batch_reg_loss: 0.0687, reg_loss: 0.0689 ||: 12%|#1 | 11/95 [00:07<00:56, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7915, UAS: 0.7842, LAS: 0.6396, UEM: 0.3657, LEM: 0.1059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3674, partial_loss/deprel_loss: 1.0387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 2.6558, batch_reg_loss: 0.0686, reg_loss: 0.0689 ||: 15%|#4 | 14/95 [00:09<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6064, UAS: 0.7826, LAS: 0.6378, UEM: 0.3203, LEM: 0.0919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4228, partial_loss/deprel_loss: 2.9571, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9187, loss: 2.6608, batch_reg_loss: 0.0684, reg_loss: 0.0688 ||: 19%|#8 | 18/95 [00:11<00:51, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7368, UAS: 0.7888, LAS: 0.6459, UEM: 0.3072, LEM: 0.0861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8931, partial_loss/deprel_loss: 1.4595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4146, loss: 2.5648, batch_reg_loss: 0.0683, reg_loss: 0.0687 ||: 22%|##2 | 21/95 [00:13<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6162, UAS: 0.7853, LAS: 0.6437, UEM: 0.2928, LEM: 0.0783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5406, partial_loss/deprel_loss: 2.8730, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8748, loss: 2.5919, batch_reg_loss: 0.0682, reg_loss: 0.0687 ||: 26%|##6 | 25/95 [00:16<00:45, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7049, UAS: 0.7937, LAS: 0.6520, UEM: 0.2802, LEM: 0.0692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2069, partial_loss/deprel_loss: 1.8636, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8003, loss: 2.4999, batch_reg_loss: 0.0681, reg_loss: 0.0686 ||: 31%|### | 29/95 [00:18<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7526, UAS: 0.7956, LAS: 0.6543, UEM: 0.2755, LEM: 0.0677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9012, partial_loss/deprel_loss: 1.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4053, loss: 2.4758, batch_reg_loss: 0.0679, reg_loss: 0.0685 ||: 34%|###3 | 32/95 [00:21<00:43, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5970, UAS: 0.7955, LAS: 0.6540, UEM: 0.2638, LEM: 0.0624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9471, partial_loss/deprel_loss: 3.2983, partial_loss/cycle_loss: 0.0000, batch_loss: 3.2959, loss: 2.4902, batch_reg_loss: 0.0678, reg_loss: 0.0685 ||: 38%|###7 | 36/95 [00:23<00:39, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6423, UAS: 0.7992, LAS: 0.6577, UEM: 0.2635, LEM: 0.0610, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0873, partial_loss/deprel_loss: 2.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5893, loss: 2.4497, batch_reg_loss: 0.0677, reg_loss: 0.0684 ||: 41%|####1 | 39/95 [00:25<00:38, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7397, UAS: 0.8000, LAS: 0.6588, UEM: 0.2579, LEM: 0.0586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1241, partial_loss/deprel_loss: 1.7406, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6849, loss: 2.4383, batch_reg_loss: 0.0676, reg_loss: 0.0683 ||: 44%|####4 | 42/95 [00:27<00:36, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6546, UAS: 0.8001, LAS: 0.6591, UEM: 0.2563, LEM: 0.0575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1341, partial_loss/deprel_loss: 2.6585, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6210, loss: 2.4478, batch_reg_loss: 0.0675, reg_loss: 0.0683 ||: 47%|####7 | 45/95 [00:30<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7658, UAS: 0.8053, LAS: 0.6651, UEM: 0.2685, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7582, partial_loss/deprel_loss: 1.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3638, loss: 2.3887, batch_reg_loss: 0.0673, reg_loss: 0.0682 ||: 52%|#####1 | 49/95 [00:32<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6690, UAS: 0.8032, LAS: 0.6633, UEM: 0.2763, LEM: 0.0646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8230, partial_loss/deprel_loss: 2.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4111, loss: 2.4123, batch_reg_loss: 0.0672, reg_loss: 0.0681 ||: 56%|#####5 | 53/95 
[00:35<00:29, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6075, UAS: 0.8054, LAS: 0.6659, UEM: 0.3141, LEM: 0.0993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6840, partial_loss/deprel_loss: 3.1979, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1622, loss: 2.3942, batch_reg_loss: 0.0671, reg_loss: 0.0681 ||: 59%|#####8 | 56/95 [00:37<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6152, UAS: 0.8064, LAS: 0.6669, UEM: 0.3160, LEM: 0.0996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6132, partial_loss/deprel_loss: 2.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9107, loss: 2.3838, batch_reg_loss: 0.0670, reg_loss: 0.0680 ||: 62%|######2 | 59/95 [00:39<00:25, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7006, UAS: 0.8043, LAS: 0.6649, UEM: 0.3079, LEM: 0.0963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3980, partial_loss/deprel_loss: 2.0046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9501, loss: 2.4046, batch_reg_loss: 0.0669, reg_loss: 0.0680 ||: 65%|######5 | 62/95 [00:42<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7086, UAS: 0.8070, LAS: 0.6679, UEM: 0.3095, LEM: 0.0952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4375, partial_loss/deprel_loss: 2.0754, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0146, loss: 2.3713, batch_reg_loss: 0.0668, reg_loss: 0.0679 ||: 68%|######8 | 65/95 [00:44<00:21, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6813, UAS: 0.8084, LAS: 0.6699, UEM: 0.3166, LEM: 0.0989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8208, partial_loss/deprel_loss: 2.2253, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2111, loss: 2.3507, batch_reg_loss: 0.0667, reg_loss: 0.0679 ||: 72%|#######1 | 68/95 [00:46<00:19, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5871, UAS: 0.8070, LAS: 0.6691, UEM: 0.3075, LEM: 0.0954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.6979, partial_loss/deprel_loss: 3.2119, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3757, loss: 2.3629, batch_reg_loss: 0.0666, reg_loss: 0.0678 ||: 76%|#######5 | 72/95 [00:49<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7640, UAS: 0.8099, LAS: 0.6725, UEM: 0.3097, LEM: 0.0946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8809, partial_loss/deprel_loss: 1.5519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4842, loss: 2.3301, batch_reg_loss: 0.0665, reg_loss: 0.0677 ||: 79%|#######8 | 75/95 [00:51<00:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6154, UAS: 0.8082, LAS: 0.6707, UEM: 0.3018, LEM: 0.0919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9648, partial_loss/deprel_loss: 3.0318, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0848, loss: 2.3541, batch_reg_loss: 0.0664, reg_loss: 0.0677 ||: 83%|########3 | 79/95 [00:53<00:11, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7683, UAS: 0.8076, LAS: 0.6706, UEM: 0.3035, LEM: 0.0922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 1.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2159, loss: 2.3611, batch_reg_loss: 0.0662, reg_loss: 0.0676 ||: 87%|########7 | 83/95 
[00:56<00:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6539, UAS: 0.8071, LAS: 0.6703, UEM: 0.2953, LEM: 0.0894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9894, partial_loss/deprel_loss: 2.5136, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4749, loss: 2.3662, batch_reg_loss: 0.0661, reg_loss: 0.0675 ||: 92%|#########1| 87/95 [00:58<00:05, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.8079, LAS: 0.6718, UEM: 0.2955, LEM: 0.0888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0825, partial_loss/deprel_loss: 1.6397, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5943, loss: 2.3576, batch_reg_loss: 0.0660, reg_loss: 0.0675 ||: 96%|#########5| 91/95 [01:02<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6631, UAS: 0.8087, LAS: 0.6729, UEM: 0.2926, LEM: 0.0870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5400, partial_loss/deprel_loss: 2.6590, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7012, loss: 2.3477, batch_reg_loss: 0.0660, reg_loss: 0.0674 ||: 99%|#########8| 94/95 [01:04<00:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7584, UAS: 0.8094, LAS: 0.6738, UEM: 0.2935, LEM: 0.0868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9615, partial_loss/deprel_loss: 1.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4326, loss: 2.3380, batch_reg_loss: 0.0659, reg_loss: 0.0674 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 22:54:13,234 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - patience | 6.000 | 
N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - reg_loss | 0.067 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UEM | 0.293 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - LEM | 0.087 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EM | 0.758 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.961 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UAS | 0.809 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.468 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - loss | 2.338 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - LAS | 0.674 | N/A\n", + "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.722 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 
0.000 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.trainer - Epoch duration: 0:01:05.182956\n", + "2023-04-06 22:54:13,236 - INFO - combo.training.trainer - Estimated training time remaining: 7:37:06\n", + "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - Epoch 4/399\n", + "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 22:54:13,244 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7843, UAS: 0.8423, LAS: 0.7132, UEM: 0.2309, LEM: 0.0471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7504, partial_loss/deprel_loss: 1.3710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3127, loss: 2.0264, batch_reg_loss: 0.0659, reg_loss: 0.0659 ||: 3%|3 | 3/95 [00:02<01:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6926, UAS: 0.8477, LAS: 0.7204, UEM: 0.3100, LEM: 0.0892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8003, partial_loss/deprel_loss: 2.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2252, loss: 1.9304, batch_reg_loss: 0.0658, reg_loss: 0.0659 ||: 6%|6 | 6/95 [00:04<01:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7859, UAS: 0.8541, LAS: 0.7301, UEM: 0.3025, LEM: 0.0763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7349, partial_loss/deprel_loss: 1.3564, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2978, loss: 1.8328, 
batch_reg_loss: 0.0657, reg_loss: 0.0658 ||: 9%|9 | 9/95 [00:06<01:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8201, UAS: 0.8576, LAS: 0.7345, UEM: 0.3501, LEM: 0.1083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.9258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8785, loss: 1.7845, batch_reg_loss: 0.0656, reg_loss: 0.0658 ||: 14%|#3 | 13/95 [00:09<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7617, UAS: 0.8507, LAS: 0.7264, UEM: 0.3186, LEM: 0.0950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9531, partial_loss/deprel_loss: 1.5410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4890, loss: 1.8748, batch_reg_loss: 0.0656, reg_loss: 0.0657 ||: 18%|#7 | 17/95 [00:11<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6461, UAS: 0.8475, LAS: 0.7246, UEM: 0.3116, LEM: 0.0926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6654, partial_loss/deprel_loss: 2.6974, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7565, loss: 1.8976, batch_reg_loss: 0.0655, reg_loss: 0.0657 ||: 21%|##1 | 20/95 [00:14<00:53, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7139, UAS: 0.8476, LAS: 0.7244, UEM: 0.2888, LEM: 0.0847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6077, partial_loss/deprel_loss: 2.1567, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1123, loss: 1.9062, batch_reg_loss: 0.0654, reg_loss: 0.0657 ||: 24%|##4 | 23/95 [00:16<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.8514, LAS: 0.7285, UEM: 0.2895, LEM: 0.0811, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9473, partial_loss/deprel_loss: 1.4645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4264, loss: 1.8600, batch_reg_loss: 0.0654, reg_loss: 0.0656 ||: 27%|##7 | 26/95 [00:18<00:50, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6262, UAS: 0.8450, LAS: 0.7213, UEM: 0.2705, LEM: 0.0746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1282, partial_loss/deprel_loss: 3.0901, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1630, loss: 1.9443, batch_reg_loss: 0.0653, reg_loss: 0.0656 ||: 32%|###1 | 30/95 [00:21<00:46, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5623, UAS: 0.8420, LAS: 0.7187, UEM: 0.2983, LEM: 0.0907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8987, partial_loss/deprel_loss: 3.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5767, loss: 1.9711, batch_reg_loss: 0.0652, reg_loss: 0.0656 ||: 35%|###4 | 33/95 [00:23<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7552, UAS: 0.8439, LAS: 0.7209, UEM: 0.2955, LEM: 0.0870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2850, partial_loss/deprel_loss: 1.7603, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7304, loss: 1.9546, batch_reg_loss: 0.0651, reg_loss: 0.0655 ||: 39%|###8 | 37/95 [00:26<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7858, UAS: 0.8456, LAS: 0.7232, UEM: 0.2993, LEM: 0.0856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7638, partial_loss/deprel_loss: 1.2336, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2048, loss: 1.9263, batch_reg_loss: 0.0651, reg_loss: 0.0655 ||: 
42%|####2 | 40/95 [00:28<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6026, UAS: 0.8447, LAS: 0.7235, UEM: 0.3057, LEM: 0.0879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5938, partial_loss/deprel_loss: 2.9975, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1818, loss: 1.9216, batch_reg_loss: 0.0650, reg_loss: 0.0655 ||: 45%|####5 | 43/95 [00:30<00:37, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5178, UAS: 0.8369, LAS: 0.7161, UEM: 0.2946, LEM: 0.0839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1605, partial_loss/deprel_loss: 3.8058, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1417, loss: 2.0016, batch_reg_loss: 0.0649, reg_loss: 0.0654 ||: 49%|####9 | 47/95 [00:33<00:33, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8353, LAS: 0.7140, UEM: 0.2853, LEM: 0.0808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3310, partial_loss/deprel_loss: 1.8267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7924, loss: 2.0231, batch_reg_loss: 0.0649, reg_loss: 0.0654 ||: 53%|#####2 | 50/95 [00:35<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7935, UAS: 0.8356, LAS: 0.7142, UEM: 0.2897, LEM: 0.0806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8164, partial_loss/deprel_loss: 1.2976, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2662, loss: 2.0258, batch_reg_loss: 0.0648, reg_loss: 0.0654 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7302, UAS: 0.8354, LAS: 0.7141, UEM: 0.2827, LEM: 0.0778, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4899, partial_loss/deprel_loss: 1.9265, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9039, loss: 2.0274, batch_reg_loss: 0.0648, reg_loss: 0.0653 ||: 59%|#####8 | 56/95 [00:39<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7533, UAS: 0.8385, LAS: 0.7180, UEM: 0.3088, LEM: 0.0960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3812, partial_loss/deprel_loss: 1.7436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7359, loss: 1.9906, batch_reg_loss: 0.0647, reg_loss: 0.0653 ||: 62%|######2 | 59/95 [00:41<00:26, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8078, UAS: 0.8402, LAS: 0.7202, UEM: 0.3200, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6234, partial_loss/deprel_loss: 1.1282, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0919, loss: 1.9686, batch_reg_loss: 0.0647, reg_loss: 0.0653 ||: 65%|######5 | 62/95 [00:44<00:24, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7705, UAS: 0.8412, LAS: 0.7218, UEM: 0.3186, LEM: 0.0985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0299, partial_loss/deprel_loss: 1.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4845, loss: 1.9581, batch_reg_loss: 0.0646, reg_loss: 0.0652 ||: 69%|######9 | 66/95 [00:46<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6569, UAS: 0.8412, LAS: 0.7219, UEM: 0.3170, LEM: 0.0974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6073, partial_loss/deprel_loss: 2.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7116, 
loss: 1.9593, batch_reg_loss: 0.0646, reg_loss: 0.0652 ||: 73%|#######2 | 69/95 [00:48<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7088, UAS: 0.8419, LAS: 0.7232, UEM: 0.3224, LEM: 0.1000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8421, partial_loss/deprel_loss: 2.0728, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0911, loss: 1.9493, batch_reg_loss: 0.0645, reg_loss: 0.0652 ||: 77%|#######6 | 73/95 [00:51<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.8427, LAS: 0.7244, UEM: 0.3220, LEM: 0.0990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1610, partial_loss/deprel_loss: 1.5024, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4986, loss: 1.9372, batch_reg_loss: 0.0645, reg_loss: 0.0651 ||: 80%|######## | 76/95 [00:53<00:12, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7085, UAS: 0.8434, LAS: 0.7254, UEM: 0.3490, LEM: 0.1270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7673, partial_loss/deprel_loss: 2.1132, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1084, loss: 1.9316, batch_reg_loss: 0.0644, reg_loss: 0.0651 ||: 83%|########3 | 79/95 [00:55<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8151, UAS: 0.8439, LAS: 0.7262, UEM: 0.3482, LEM: 0.1258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4797, partial_loss/deprel_loss: 1.0876, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0303, loss: 1.9255, batch_reg_loss: 0.0643, reg_loss: 0.0651 ||: 87%|########7 | 83/95 [00:58<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7979, UAS: 
0.8448, LAS: 0.7271, UEM: 0.3537, LEM: 0.1279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7547, partial_loss/deprel_loss: 1.3058, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2599, loss: 1.9150, batch_reg_loss: 0.0643, reg_loss: 0.0650 ||: 91%|######### | 86/95 [01:00<00:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7795, UAS: 0.8455, LAS: 0.7279, UEM: 0.3476, LEM: 0.1250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0215, partial_loss/deprel_loss: 1.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4521, loss: 1.9097, batch_reg_loss: 0.0643, reg_loss: 0.0650 ||: 94%|#########3| 89/95 [01:02<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7703, UAS: 0.8448, LAS: 0.7275, UEM: 0.3426, LEM: 0.1220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0980, partial_loss/deprel_loss: 1.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4857, loss: 1.9164, batch_reg_loss: 0.0642, reg_loss: 0.0650 ||: 98%|#########7| 93/95 [01:05<00:01, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8175, UAS: 0.8456, LAS: 0.7284, UEM: 0.3446, LEM: 0.1221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5265, partial_loss/deprel_loss: 1.0597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0172, loss: 1.9074, batch_reg_loss: 0.0642, reg_loss: 0.0650 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-06 22:55:19,632 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - reg_loss | 0.065 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UEM | 0.345 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - LEM | 0.122 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - EM | 0.817 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.526 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UAS | 0.846 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.060 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - loss | 1.907 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - LAS | 0.728 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.722 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:19,634 - 
INFO - combo.training.trainer - Epoch duration: 0:01:06.397867\n", + "2023-04-06 22:55:19,635 - INFO - combo.training.trainer - Estimated training time remaining: 7:32:11\n", + "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - Epoch 5/399\n", + "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:55:19,642 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7362, UAS: 0.8409, LAS: 0.7299, UEM: 0.1639, LEM: 0.0250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5391, partial_loss/deprel_loss: 1.9122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9017, loss: 1.9255, batch_reg_loss: 0.0641, reg_loss: 0.0642 ||: 3%|3 | 3/95 [00:02<01:11, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7690, UAS: 0.8589, LAS: 0.7505, UEM: 0.2830, LEM: 0.0794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1920, partial_loss/deprel_loss: 1.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5425, loss: 1.7310, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||: 6%|6 | 6/95 [00:04<01:07, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.8832, LAS: 0.7762, UEM: 0.4822, LEM: 0.1763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3430, partial_loss/deprel_loss: 0.8381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 1.4723, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||: 9%|9 | 9/95 [00:06<01:05, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7172, UAS: 0.8691, LAS: 0.7610, UEM: 0.4246, LEM: 0.1533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8046, partial_loss/deprel_loss: 1.9388, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9760, loss: 1.6106, batch_reg_loss: 0.0640, reg_loss: 0.0641 ||: 14%|#3 | 13/95 [00:09<00:59, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6100, UAS: 0.8599, LAS: 0.7513, UEM: 0.3860, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4556, partial_loss/deprel_loss: 2.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0833, loss: 1.7038, batch_reg_loss: 0.0640, reg_loss: 0.0641 ||: 17%|#6 | 16/95 [00:11<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6830, UAS: 0.8635, LAS: 0.7553, UEM: 0.4120, LEM: 0.1493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1722, partial_loss/deprel_loss: 2.3345, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3660, loss: 1.6729, batch_reg_loss: 0.0639, reg_loss: 0.0641 ||: 20%|## | 19/95 [00:13<00:56, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8055, UAS: 0.8630, LAS: 0.7545, UEM: 0.3829, LEM: 0.1339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8116, partial_loss/deprel_loss: 1.2710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2430, loss: 1.6813, batch_reg_loss: 0.0639, reg_loss: 0.0640 ||: 24%|##4 | 23/95 [00:16<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7791, UAS: 0.8597, LAS: 0.7516, UEM: 0.3563, LEM: 0.1215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9777, partial_loss/deprel_loss: 1.4278, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.4016, loss: 1.7203, batch_reg_loss: 0.0639, reg_loss: 0.0640 ||: 28%|##8 | 27/95 [00:18<00:45, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.8656, LAS: 0.7593, UEM: 0.4287, LEM: 0.1921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6121, partial_loss/deprel_loss: 0.9983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9849, loss: 1.6482, batch_reg_loss: 0.0638, reg_loss: 0.0640 ||: 32%|###1 | 30/95 [00:21<00:46, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7071, UAS: 0.8680, LAS: 0.7625, UEM: 0.4650, LEM: 0.2164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0660, partial_loss/deprel_loss: 2.1342, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1843, loss: 1.6122, batch_reg_loss: 0.0638, reg_loss: 0.0640 ||: 35%|###4 | 33/95 [00:23<00:46, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7614, UAS: 0.8645, LAS: 0.7587, UEM: 0.4402, LEM: 0.2026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2990, partial_loss/deprel_loss: 1.6074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6095, loss: 1.6531, batch_reg_loss: 0.0637, reg_loss: 0.0640 ||: 39%|###8 | 37/95 [00:26<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6848, UAS: 0.8611, LAS: 0.7551, UEM: 0.4345, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6570, partial_loss/deprel_loss: 2.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5164, loss: 1.6897, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||: 43%|####3 | 41/95 [00:28<00:36, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.7787, UAS: 0.8584, LAS: 0.7522, UEM: 0.4205, LEM: 0.1885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0538, partial_loss/deprel_loss: 1.4761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4553, loss: 1.7256, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||: 47%|####7 | 45/95 [00:31<00:33, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8132, UAS: 0.8591, LAS: 0.7532, UEM: 0.4148, LEM: 0.1806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8750, partial_loss/deprel_loss: 1.2898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2705, loss: 1.7183, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||: 52%|#####1 | 49/95 [00:33<00:30, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7496, UAS: 0.8582, LAS: 0.7519, UEM: 0.4014, LEM: 0.1722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3200, partial_loss/deprel_loss: 1.7153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6999, loss: 1.7334, batch_reg_loss: 0.0636, reg_loss: 0.0639 ||: 56%|#####5 | 53/95 [00:36<00:27, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6925, UAS: 0.8586, LAS: 0.7525, UEM: 0.4015, LEM: 0.1710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3983, partial_loss/deprel_loss: 2.4521, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5049, loss: 1.7337, batch_reg_loss: 0.0636, reg_loss: 0.0639 ||: 60%|###### | 57/95 [00:39<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7734, UAS: 0.8588, LAS: 0.7527, UEM: 0.3885, LEM: 0.1633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1734, partial_loss/deprel_loss: 1.5985, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.5771, loss: 1.7317, batch_reg_loss: 0.0636, reg_loss: 0.0638 ||: 64%|######4 | 61/95 [00:41<00:22, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.8617, LAS: 0.7560, UEM: 0.3955, LEM: 0.1630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5772, partial_loss/deprel_loss: 0.9634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9498, loss: 1.6978, batch_reg_loss: 0.0636, reg_loss: 0.0638 ||: 68%|######8 | 65/95 [00:44<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6948, UAS: 0.8627, LAS: 0.7569, UEM: 0.4035, LEM: 0.1681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5275, partial_loss/deprel_loss: 2.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5289, loss: 1.6927, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8050, UAS: 0.8632, LAS: 0.7576, UEM: 0.3997, LEM: 0.1647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7576, partial_loss/deprel_loss: 1.1395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1266, loss: 1.6848, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||: 75%|#######4 | 71/95 [00:49<00:17, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.8658, LAS: 0.7608, UEM: 0.4055, LEM: 0.1652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.9915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9802, loss: 1.6526, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||: 79%|#######8 | 75/95 [00:52<00:14, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7611, UAS: 0.8631, LAS: 0.7583, UEM: 0.3988, LEM: 0.1623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3472, partial_loss/deprel_loss: 1.7179, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7072, loss: 1.6814, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||: 82%|########2 | 78/95 [00:54<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8106, UAS: 0.8635, LAS: 0.7589, UEM: 0.3952, LEM: 0.1594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7722, partial_loss/deprel_loss: 1.0976, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0960, loss: 1.6750, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||: 85%|########5 | 81/95 [00:56<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7472, UAS: 0.8634, LAS: 0.7587, UEM: 0.3876, LEM: 0.1554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4159, partial_loss/deprel_loss: 1.8051, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7907, loss: 1.6768, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 88%|########8 | 84/95 [00:58<00:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8146, UAS: 0.8635, LAS: 0.7590, UEM: 0.3890, LEM: 0.1548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7390, partial_loss/deprel_loss: 1.1997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1710, loss: 1.6739, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 92%|#########1| 87/95 [01:00<00:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.8644, LAS: 0.7604, UEM: 0.3879, LEM: 0.1527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.9408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9357, loss: 1.6605, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 96%|#########5| 91/95 [01:03<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.8655, LAS: 0.7616, UEM: 0.3865, LEM: 0.1504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.9392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9155, loss: 1.6492, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 99%|#########8| 94/95 [01:05<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7393, UAS: 0.8654, LAS: 0.7613, UEM: 0.3842, LEM: 0.1492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3101, partial_loss/deprel_loss: 1.8342, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7927, loss: 1.6507, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-06 22:56:25,630 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7846, UAS: 0.9080, LAS: 0.8175, UEM: 0.4009, LEM: 0.1300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2796, partial_loss/deprel_loss: 39.2859, partial_loss/cycle_loss: 0.0000, batch_loss: 31.6847, loss: 23.2949, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9219, LAS: 0.8351, UEM: 0.5020, LEM: 0.1876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5392, partial_loss/deprel_loss: 25.7007, partial_loss/cycle_loss: 0.0000, 
batch_loss: 20.6684, loss: 21.8143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7895, UAS: 0.9238, LAS: 0.8396, UEM: 0.5798, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4669, partial_loss/deprel_loss: 43.6367, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2028, loss: 22.2369, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7461, UAS: 0.9152, LAS: 0.8299, UEM: 0.5427, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0760, partial_loss/deprel_loss: 51.1684, partial_loss/cycle_loss: 0.0000, batch_loss: 41.3499, loss: 23.5376, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - reg_loss | 0.064 | 0.000\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - UEM | 0.384 | 0.543\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - LEM | 0.149 | 0.247\n", + "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EM | 0.739 | 0.746\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.310 | 2.076\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 
0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - UAS | 0.865 | 0.915\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.834 | 51.168\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - loss | 1.651 | 23.538\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - LAS | 0.761 | 0.830\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.722 | N/A\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 22:56:36,167 - INFO - combo.training.trainer - Epoch duration: 0:01:16.532214\n", + "2023-04-06 22:56:36,167 - INFO - combo.training.trainer - Estimated training time remaining: 7:39:37\n", + "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - Epoch 6/399\n", + "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:56:36,173 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": 
"stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8139, UAS: 0.8852, LAS: 0.7845, UEM: 0.4318, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7961, partial_loss/deprel_loss: 1.2270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2042, loss: 1.4337, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||: 4%|4 | 4/95 [00:02<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7204, UAS: 0.8715, LAS: 0.7707, UEM: 0.3227, LEM: 0.1179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0650, partial_loss/deprel_loss: 2.0459, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1131, loss: 1.5804, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||: 7%|7 | 7/95 [00:05<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8260, UAS: 0.8775, LAS: 0.7779, UEM: 0.3232, LEM: 0.1062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7638, partial_loss/deprel_loss: 1.1360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1249, loss: 1.5147, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||: 11%|# | 10/95 [00:07<00:59, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7200, UAS: 0.8655, LAS: 0.7663, UEM: 0.3436, LEM: 0.1184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1232, partial_loss/deprel_loss: 2.0626, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1381, loss: 1.6473, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||: 14%|#3 | 13/95 [00:09<01:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7778, UAS: 0.8593, LAS: 0.7603, UEM: 0.3078, LEM: 0.1035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3290, partial_loss/deprel_loss: 1.5895, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6007, loss: 1.7120, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||: 17%|#6 | 16/95 [00:12<01:00, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6399, UAS: 0.8593, LAS: 0.7595, UEM: 0.3445, LEM: 0.1216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1261, partial_loss/deprel_loss: 2.7053, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8528, loss: 1.7150, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 20%|## | 19/95 [00:14<00:56, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7184, UAS: 0.8653, LAS: 0.7650, UEM: 0.3841, LEM: 0.1386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9814, partial_loss/deprel_loss: 2.0559, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1043, loss: 1.6599, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 23%|##3 | 22/95 [00:16<00:54, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8084, UAS: 0.8685, LAS: 0.7680, UEM: 0.3554, LEM: 0.1227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9110, partial_loss/deprel_loss: 1.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2960, loss: 1.6295, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 27%|##7 | 26/95 [00:18<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8365, UAS: 0.8739, LAS: 0.7741, UEM: 0.3662, LEM: 0.1229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5057, partial_loss/deprel_loss: 0.9085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8912, loss: 1.5664, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 32%|###1 | 30/95 [00:21<00:44, 1.46it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8551, UAS: 0.8775, LAS: 0.7785, UEM: 0.3891, LEM: 0.1362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3909, partial_loss/deprel_loss: 0.7925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7755, loss: 1.5217, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 35%|###4 | 33/95 [00:23<00:44, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7322, UAS: 0.8787, LAS: 0.7806, UEM: 0.4363, LEM: 0.1945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8153, partial_loss/deprel_loss: 1.9592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9937, loss: 1.5023, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 38%|###7 | 36/95 [00:25<00:43, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7980, UAS: 0.8798, LAS: 0.7821, UEM: 0.4186, LEM: 0.1809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9276, partial_loss/deprel_loss: 1.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3436, loss: 1.4864, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 42%|####2 | 40/95 [00:28<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7367, UAS: 0.8780, LAS: 0.7800, UEM: 0.4028, LEM: 0.1734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7696, partial_loss/deprel_loss: 1.8948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9331, loss: 1.5062, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 45%|####5 | 43/95 [00:30<00:35, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7507, UAS: 0.8786, LAS: 0.7810, UEM: 0.4198, LEM: 0.1913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5450, 
partial_loss/deprel_loss: 1.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7754, loss: 1.4948, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 48%|####8 | 46/95 [00:32<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.8789, LAS: 0.7816, UEM: 0.4310, LEM: 0.1998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2861, partial_loss/deprel_loss: 0.6546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 1.4886, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 53%|#####2 | 50/95 [00:35<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8275, UAS: 0.8791, LAS: 0.7819, UEM: 0.4291, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.8703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 1.4817, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.8779, LAS: 0.7809, UEM: 0.4186, LEM: 0.1913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7167, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0527, loss: 1.4918, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 60%|###### | 57/95 [00:39<00:25, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.8802, LAS: 0.7837, UEM: 0.4213, LEM: 0.1882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 1.0188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0213, loss: 1.4653, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 64%|######4 | 61/95 [00:42<00:22, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8187, UAS: 0.8810, LAS: 0.7847, UEM: 0.4127, LEM: 0.1803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6354, partial_loss/deprel_loss: 1.0926, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 1.4554, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 68%|######8 | 65/95 [00:45<00:20, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.8816, LAS: 0.7855, UEM: 0.4126, LEM: 0.1791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4871, partial_loss/deprel_loss: 0.9315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 1.4468, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 73%|#######2 | 69/95 [00:47<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.8789, LAS: 0.7825, UEM: 0.4021, LEM: 0.1739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5896, partial_loss/deprel_loss: 1.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8373, loss: 1.4763, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 77%|#######6 | 73/95 [00:50<00:14, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7718, UAS: 0.8752, LAS: 0.7785, UEM: 0.3939, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2170, partial_loss/deprel_loss: 1.6286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6096, loss: 1.5194, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||: 81%|########1 | 77/95 [00:52<00:11, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7139, UAS: 0.8748, LAS: 0.7783, UEM: 0.3947, LEM: 0.1693, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2148, partial_loss/deprel_loss: 2.2443, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3018, loss: 1.5257, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 85%|########5 | 81/95 [00:55<00:08, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8317, UAS: 0.8772, LAS: 0.7809, UEM: 0.4104, LEM: 0.1758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 0.9438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9222, loss: 1.4992, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 89%|########9 | 85/95 [00:58<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8445, UAS: 0.8758, LAS: 0.7795, UEM: 0.4091, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.9501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9301, loss: 1.5140, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 93%|#########2| 88/95 [01:00<00:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7635, UAS: 0.8765, LAS: 0.7801, UEM: 0.4065, LEM: 0.1706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2404, partial_loss/deprel_loss: 1.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6761, loss: 1.5071, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 96%|#########5| 91/95 [01:03<00:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7174, UAS: 0.8776, LAS: 0.7814, UEM: 0.4107, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1446, partial_loss/deprel_loss: 2.0900, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1643, loss: 1.4954, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 
100%|##########| 95/95 [01:05<00:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7174, UAS: 0.8776, LAS: 0.7814, UEM: 0.4107, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1446, partial_loss/deprel_loss: 2.0900, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1643, loss: 1.4954, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-06 22:57:41,968 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:57:41,968 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - reg_loss | 0.063 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UEM | 0.411 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - LEM | 0.170 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EM | 0.717 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 2.145 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UAS | 0.878 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 2.090 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - loss | 1.495 | 
N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - LAS | 0.781 | N/A\n", + "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:57:41,970 - INFO - combo.training.trainer - Epoch duration: 0:01:05.803367\n", + "2023-04-06 22:57:41,971 - INFO - combo.training.trainer - Estimated training time remaining: 7:34:32\n", + "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - Epoch 7/399\n", + "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:57:41,978 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7544, UAS: 0.8492, LAS: 0.7522, UEM: 0.0364, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5982, partial_loss/deprel_loss: 1.6971, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7408, loss: 1.7857, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||: 3%|3 | 3/95 [00:02<01:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8092, UAS: 0.8525, LAS: 0.7608, UEM: 0.2493, LEM: 0.0764, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9619, partial_loss/deprel_loss: 1.2887, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2868, loss: 1.7437, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||: 6%|6 | 6/95 [00:04<01:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8765, UAS: 0.8710, LAS: 0.7817, UEM: 0.5237, LEM: 0.2864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2644, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 1.5241, batch_reg_loss: 0.0635, reg_loss: 0.0634 ||: 9%|9 | 9/95 [00:06<01:02, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.8785, LAS: 0.7900, UEM: 0.5429, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4888, partial_loss/deprel_loss: 0.8685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8561, loss: 1.4643, batch_reg_loss: 0.0635, reg_loss: 0.0634 ||: 13%|#2 | 12/95 [00:08<01:01, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7300, UAS: 0.8770, LAS: 0.7874, UEM: 0.5009, LEM: 0.2479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7910, partial_loss/deprel_loss: 1.8718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9192, loss: 1.4855, batch_reg_loss: 0.0635, reg_loss: 0.0635 ||: 17%|#6 | 16/95 [00:11<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.8833, LAS: 0.7951, UEM: 0.5561, LEM: 0.3169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1348, partial_loss/deprel_loss: 0.3689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3856, loss: 1.4103, 
batch_reg_loss: 0.0635, reg_loss: 0.0635 ||: 21%|##1 | 20/95 [00:13<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7715, UAS: 0.8874, LAS: 0.7989, UEM: 0.5485, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2845, partial_loss/deprel_loss: 1.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6074, loss: 1.3682, batch_reg_loss: 0.0635, reg_loss: 0.0635 ||: 25%|##5 | 24/95 [00:16<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7687, UAS: 0.8862, LAS: 0.7975, UEM: 0.5455, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2891, partial_loss/deprel_loss: 1.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5598, loss: 1.3750, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||: 29%|##9 | 28/95 [00:18<00:43, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7934, UAS: 0.8880, LAS: 0.7994, UEM: 0.5226, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0129, partial_loss/deprel_loss: 1.4350, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4142, loss: 1.3573, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||: 34%|###3 | 32/95 [00:20<00:38, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8348, UAS: 0.8865, LAS: 0.7973, UEM: 0.5038, LEM: 0.2591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7337, partial_loss/deprel_loss: 1.0537, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0533, loss: 1.3775, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||: 38%|###7 | 36/95 [00:23<00:37, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7901, UAS: 0.8859, LAS: 0.7964, UEM: 0.4948, LEM: 
0.2505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1651, partial_loss/deprel_loss: 1.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4428, loss: 1.3839, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||: 42%|####2 | 40/95 [00:26<00:36, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.8884, LAS: 0.7995, UEM: 0.4954, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4473, partial_loss/deprel_loss: 0.8673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8470, loss: 1.3582, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||: 46%|####6 | 44/95 [00:28<00:32, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8306, UAS: 0.8885, LAS: 0.7994, UEM: 0.4912, LEM: 0.2366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7249, partial_loss/deprel_loss: 1.0650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 1.3584, batch_reg_loss: 0.0637, reg_loss: 0.0635 ||: 51%|##### | 48/95 [00:31<00:31, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7623, UAS: 0.8889, LAS: 0.7999, UEM: 0.4876, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5943, partial_loss/deprel_loss: 1.6767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7239, loss: 1.3541, batch_reg_loss: 0.0637, reg_loss: 0.0636 ||: 55%|#####4 | 52/95 [00:34<00:27, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.8912, LAS: 0.8026, UEM: 0.4893, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 1.3281, batch_reg_loss: 0.0637, reg_loss: 
0.0636 ||: 59%|#####8 | 56/95 [00:36<00:25, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.8917, LAS: 0.8028, UEM: 0.4824, LEM: 0.2238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4378, partial_loss/deprel_loss: 0.8147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8031, loss: 1.3214, batch_reg_loss: 0.0637, reg_loss: 0.0636 ||: 63%|######3 | 60/95 [00:39<00:23, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.8922, LAS: 0.8035, UEM: 0.4789, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5806, partial_loss/deprel_loss: 1.0386, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0107, loss: 1.3139, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||: 67%|######7 | 64/95 [00:42<00:20, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.8920, LAS: 0.8032, UEM: 0.4758, LEM: 0.2142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6390, partial_loss/deprel_loss: 1.0286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0145, loss: 1.3176, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||: 72%|#######1 | 68/95 [00:44<00:17, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8204, UAS: 0.8900, LAS: 0.8012, UEM: 0.4661, LEM: 0.2089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9543, partial_loss/deprel_loss: 1.2122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2244, loss: 1.3393, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||: 76%|#######5 | 72/95 [00:46<00:14, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.8907, LAS: 0.8018, UEM: 0.4598, LEM: 0.2040, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2010, partial_loss/deprel_loss: 1.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5190, loss: 1.3337, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||: 80%|######## | 76/95 [00:49<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.8885, LAS: 0.7995, UEM: 0.4531, LEM: 0.1996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 1.2435, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2418, loss: 1.3594, batch_reg_loss: 0.0639, reg_loss: 0.0636 ||: 84%|########4 | 80/95 [00:52<00:09, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7586, UAS: 0.8867, LAS: 0.7973, UEM: 0.4429, LEM: 0.1946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4134, partial_loss/deprel_loss: 1.8125, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7965, loss: 1.3824, batch_reg_loss: 0.0639, reg_loss: 0.0636 ||: 88%|########8 | 84/95 [00:55<00:07, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8012, UAS: 0.8867, LAS: 0.7972, UEM: 0.4449, LEM: 0.1972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1268, partial_loss/deprel_loss: 1.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3396, loss: 1.3818, batch_reg_loss: 0.0639, reg_loss: 0.0637 ||: 93%|#########2| 88/95 [00:58<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7951, UAS: 0.8871, LAS: 0.7972, UEM: 0.4409, LEM: 0.1933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9967, partial_loss/deprel_loss: 1.4019, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.3849, loss: 1.3799, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||: 96%|#########5| 91/95 [01:00<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.8875, LAS: 0.7973, UEM: 0.4360, LEM: 0.1894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8249, partial_loss/deprel_loss: 1.0910, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1018, loss: 1.3791, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||: 99%|#########8| 94/95 [01:02<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7707, UAS: 0.8873, LAS: 0.7970, UEM: 0.4336, LEM: 0.1881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2738, partial_loss/deprel_loss: 1.5326, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5448, loss: 1.3809, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-06 22:58:45,366 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - reg_loss | 0.064 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UEM | 0.434 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - LEM | 0.188 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EM | 0.771 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.274 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", 
+ "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UAS | 0.887 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.533 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - loss | 1.381 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - LAS | 0.797 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:58:45,368 - INFO - combo.training.trainer - Epoch duration: 0:01:03.397784\n", + "2023-04-06 22:58:45,369 - INFO - combo.training.trainer - Estimated training time remaining: 7:28:29\n", + "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - Epoch 8/399\n", + "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:58:45,375 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.7960, UAS: 0.8766, LAS: 0.7884, UEM: 0.0867, LEM: 0.0186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1714, partial_loss/deprel_loss: 1.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4483, loss: 1.5283, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||: 3%|3 | 3/95 [00:02<01:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.8879, LAS: 0.7993, UEM: 0.2805, LEM: 0.0809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5547, partial_loss/deprel_loss: 0.9722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9528, loss: 1.3837, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||: 7%|7 | 7/95 [00:04<00:58, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.8982, LAS: 0.8128, UEM: 0.3722, LEM: 0.1342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6149, partial_loss/deprel_loss: 0.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9510, loss: 1.2616, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||: 13%|#2 | 12/95 [00:06<00:49, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8342, UAS: 0.8925, LAS: 0.8064, UEM: 0.3546, LEM: 0.1231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6295, partial_loss/deprel_loss: 0.9856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 1.3014, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||: 16%|#5 | 15/95 [00:09<00:52, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7982, UAS: 0.8977, LAS: 0.8115, UEM: 0.3777, LEM: 0.1298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8726, partial_loss/deprel_loss: 1.2775, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2607, loss: 
1.2535, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||: 19%|#8 | 18/95 [00:11<00:53, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7925, UAS: 0.8982, LAS: 0.8117, UEM: 0.3924, LEM: 0.1437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1242, partial_loss/deprel_loss: 1.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4473, loss: 1.2433, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||: 22%|##2 | 21/95 [00:13<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7558, UAS: 0.8948, LAS: 0.8080, UEM: 0.3640, LEM: 0.1318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7870, partial_loss/deprel_loss: 1.7873, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8515, loss: 1.2800, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||: 26%|##6 | 25/95 [00:15<00:46, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8093, UAS: 0.8991, LAS: 0.8129, UEM: 0.4093, LEM: 0.1608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9189, partial_loss/deprel_loss: 1.2039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2112, loss: 1.2355, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||: 29%|##9 | 28/95 [00:18<00:45, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9023, LAS: 0.8164, UEM: 0.4421, LEM: 0.1855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7983, partial_loss/deprel_loss: 1.0589, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0711, loss: 1.1956, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||: 33%|###2 | 31/95 [00:20<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8526, UAS: 0.8993, LAS: 0.8138, UEM: 0.4486, LEM: 0.1915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4474, partial_loss/deprel_loss: 0.7212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7308, loss: 1.2169, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||: 36%|###5 | 34/95 [00:22<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.8992, LAS: 0.8139, UEM: 0.4544, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.8630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8515, loss: 1.2150, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||: 40%|#### | 38/95 [00:25<00:41, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8091, UAS: 0.8998, LAS: 0.8147, UEM: 0.4529, LEM: 0.1911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1905, partial_loss/deprel_loss: 1.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4105, loss: 1.2106, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||: 43%|####3 | 41/95 [00:27<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8411, UAS: 0.8994, LAS: 0.8142, UEM: 0.4556, LEM: 0.1896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.9996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9817, loss: 1.2179, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||: 47%|####7 | 45/95 [00:30<00:33, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.8983, LAS: 0.8123, UEM: 0.4424, LEM: 0.1808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6947, partial_loss/deprel_loss: 1.0266, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.0247, loss: 1.2359, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||: 52%|#####1 | 49/95 [00:32<00:30, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7533, UAS: 0.8985, LAS: 0.8127, UEM: 0.4414, LEM: 0.1795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5425, partial_loss/deprel_loss: 1.5829, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6393, loss: 1.2254, batch_reg_loss: 0.0645, reg_loss: 0.0643 ||: 56%|#####5 | 53/95 [00:35<00:27, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7877, UAS: 0.8973, LAS: 0.8112, UEM: 0.4319, LEM: 0.1743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3386, partial_loss/deprel_loss: 1.4528, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4945, loss: 1.2410, batch_reg_loss: 0.0645, reg_loss: 0.0643 ||: 60%|###### | 57/95 [00:38<00:25, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.8975, LAS: 0.8113, UEM: 0.4308, LEM: 0.1737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3600, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7277, loss: 1.2418, batch_reg_loss: 0.0646, reg_loss: 0.0643 ||: 64%|######4 | 61/95 [00:40<00:22, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.8972, LAS: 0.8109, UEM: 0.4285, LEM: 0.1730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3648, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 1.2476, batch_reg_loss: 0.0646, reg_loss: 0.0643 ||: 68%|######8 | 65/95 [00:42<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8825, UAS: 0.8979, LAS: 0.8122, UEM: 0.4507, LEM: 0.1927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2452, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5161, loss: 1.2376, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||: 73%|#######2 | 69/95 [00:45<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7070, UAS: 0.8969, LAS: 0.8110, UEM: 0.4422, LEM: 0.1873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3662, partial_loss/deprel_loss: 2.1813, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2830, loss: 1.2500, batch_reg_loss: 0.0647, reg_loss: 0.0644 ||: 77%|#######6 | 73/95 [00:48<00:14, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.8951, LAS: 0.8090, UEM: 0.4329, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7761, partial_loss/deprel_loss: 1.0307, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0446, loss: 1.2678, batch_reg_loss: 0.0648, reg_loss: 0.0644 ||: 81%|########1 | 77/95 [00:51<00:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.8959, LAS: 0.8101, UEM: 0.4385, LEM: 0.1888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7951, partial_loss/deprel_loss: 1.1140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1150, loss: 1.2612, batch_reg_loss: 0.0648, reg_loss: 0.0644 ||: 85%|########5 | 81/95 [00:54<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8287, UAS: 0.8950, LAS: 0.8088, UEM: 0.4376, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8267, partial_loss/deprel_loss: 1.1303, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.1344, loss: 1.2756, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||: 89%|########9 | 85/95 [00:56<00:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8440, UAS: 0.8945, LAS: 0.8085, UEM: 0.4560, LEM: 0.2097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6894, partial_loss/deprel_loss: 0.9977, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0009, loss: 1.2818, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||: 94%|#########3| 89/95 [00:59<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.8938, LAS: 0.8077, UEM: 0.4470, LEM: 0.2044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8120, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0858, loss: 1.2908, batch_reg_loss: 0.0650, reg_loss: 0.0645 ||: 98%|#########7| 93/95 [01:01<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7516, UAS: 0.8926, LAS: 0.8065, UEM: 0.4427, LEM: 0.2025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7706, partial_loss/deprel_loss: 1.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8177, loss: 1.3028, batch_reg_loss: 0.0650, reg_loss: 0.0645 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-06 22:59:48,520 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - reg_loss | 0.064 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - 
combo.training.tensorboard_writer - UEM | 0.443 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - LEM | 0.202 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EM | 0.752 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.771 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - UAS | 0.893 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.748 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - loss | 1.303 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - LAS | 0.806 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.trainer - Epoch duration: 0:01:03.153713\n", + "2023-04-06 22:59:48,522 - INFO - combo.training.trainer - Estimated training time remaining: 7:23:22\n", + "2023-04-06 
22:59:48,522 - INFO - allennlp.training.trainer - Epoch 9/399\n", + "2023-04-06 22:59:48,523 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 22:59:48,523 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:59:48,529 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9012, LAS: 0.8183, UEM: 0.3259, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6332, partial_loss/deprel_loss: 0.8460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8685, loss: 1.2115, batch_reg_loss: 0.0650, reg_loss: 0.0650 ||: 4%|4 | 4/95 [00:02<00:49, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8063, UAS: 0.9085, LAS: 0.8263, UEM: 0.4017, LEM: 0.1348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1179, partial_loss/deprel_loss: 1.2629, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2989, loss: 1.1239, batch_reg_loss: 0.0651, reg_loss: 0.0650 ||: 7%|7 | 7/95 [00:04<00:53, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8399, UAS: 0.8992, LAS: 0.8168, UEM: 0.3929, LEM: 0.1274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7859, partial_loss/deprel_loss: 0.9736, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0012, loss: 1.2177, batch_reg_loss: 0.0651, reg_loss: 0.0651 ||: 11%|# | 10/95 [00:06<00:55, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7336, UAS: 0.8973, LAS: 0.8147, UEM: 0.3889, LEM: 0.1248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3379, 
partial_loss/deprel_loss: 1.8283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9954, loss: 1.2410, batch_reg_loss: 0.0652, reg_loss: 0.0651 ||: 14%|#3 | 13/95 [00:08<00:55, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.8937, LAS: 0.8107, UEM: 0.3964, LEM: 0.1369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.7168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 1.2798, batch_reg_loss: 0.0652, reg_loss: 0.0651 ||: 17%|#6 | 16/95 [00:10<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7957, UAS: 0.8909, LAS: 0.8065, UEM: 0.3515, LEM: 0.1187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2395, partial_loss/deprel_loss: 1.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4966, loss: 1.3237, batch_reg_loss: 0.0653, reg_loss: 0.0651 ||: 21%|##1 | 20/95 [00:13<00:50, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.8905, LAS: 0.8061, UEM: 0.3490, LEM: 0.1206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4946, partial_loss/deprel_loss: 0.7930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 1.3368, batch_reg_loss: 0.0653, reg_loss: 0.0652 ||: 25%|##5 | 24/95 [00:16<00:48, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7865, UAS: 0.8863, LAS: 0.8018, UEM: 0.3213, LEM: 0.1094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5779, partial_loss/deprel_loss: 1.6368, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6904, loss: 1.3790, batch_reg_loss: 0.0654, reg_loss: 0.0652 ||: 29%|##9 | 28/95 [00:18<00:44, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.8878, LAS: 0.8028, UEM: 0.3248, LEM: 0.1124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 1.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3899, loss: 1.3691, batch_reg_loss: 0.0654, reg_loss: 0.0652 ||: 33%|###2 | 31/95 [00:21<00:43, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.8900, LAS: 0.8052, UEM: 0.3452, LEM: 0.1243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.6592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6549, loss: 1.3427, batch_reg_loss: 0.0655, reg_loss: 0.0652 ||: 37%|###6 | 35/95 [00:23<00:40, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7492, UAS: 0.8914, LAS: 0.8071, UEM: 0.3706, LEM: 0.1420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7194, partial_loss/deprel_loss: 1.7316, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7946, loss: 1.3227, batch_reg_loss: 0.0655, reg_loss: 0.0652 ||: 40%|#### | 38/95 [00:25<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7134, UAS: 0.8890, LAS: 0.8047, UEM: 0.3838, LEM: 0.1508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8345, partial_loss/deprel_loss: 2.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3944, loss: 1.3478, batch_reg_loss: 0.0656, reg_loss: 0.0653 ||: 43%|####3 | 41/95 [00:27<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8218, UAS: 0.8897, LAS: 0.8053, UEM: 0.3825, LEM: 0.1483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8915, partial_loss/deprel_loss: 1.1250, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.1439, loss: 1.3414, batch_reg_loss: 0.0656, reg_loss: 0.0653 ||: 46%|####6 | 44/95 [00:30<00:35, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.8897, LAS: 0.8056, UEM: 0.3805, LEM: 0.1461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4738, partial_loss/deprel_loss: 0.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8353, loss: 1.3372, batch_reg_loss: 0.0657, reg_loss: 0.0653 ||: 51%|##### | 48/95 [00:32<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.8916, LAS: 0.8080, UEM: 0.3958, LEM: 0.1551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5700, partial_loss/deprel_loss: 0.9175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9137, loss: 1.3151, batch_reg_loss: 0.0657, reg_loss: 0.0653 ||: 54%|#####3 | 51/95 [00:34<00:29, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.8923, LAS: 0.8088, UEM: 0.3921, LEM: 0.1524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2080, partial_loss/deprel_loss: 1.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4113, loss: 1.3055, batch_reg_loss: 0.0658, reg_loss: 0.0654 ||: 57%|#####6 | 54/95 [00:36<00:28, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.8919, LAS: 0.8083, UEM: 0.3842, LEM: 0.1482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7063, partial_loss/deprel_loss: 0.9721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9848, loss: 1.3098, batch_reg_loss: 0.0658, reg_loss: 0.0654 ||: 60%|###### | 57/95 [00:38<00:26, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8125, UAS: 0.8930, LAS: 0.8092, UEM: 0.3777, LEM: 0.1422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9309, partial_loss/deprel_loss: 1.2323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2379, loss: 1.3015, batch_reg_loss: 0.0659, reg_loss: 0.0654 ||: 64%|######4 | 61/95 [00:41<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8311, UAS: 0.8943, LAS: 0.8108, UEM: 0.3858, LEM: 0.1472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8321, partial_loss/deprel_loss: 1.1460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1492, loss: 1.2876, batch_reg_loss: 0.0659, reg_loss: 0.0654 ||: 67%|######7 | 64/95 [00:43<00:20, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.8929, LAS: 0.8095, UEM: 0.3785, LEM: 0.1434, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9436, partial_loss/deprel_loss: 1.1526, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1768, loss: 1.2997, batch_reg_loss: 0.0660, reg_loss: 0.0655 ||: 71%|####### | 67/95 [00:45<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8328, UAS: 0.8940, LAS: 0.8105, UEM: 0.3968, LEM: 0.1612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7408, partial_loss/deprel_loss: 1.0109, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0229, loss: 1.2885, batch_reg_loss: 0.0661, reg_loss: 0.0655 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.8952, LAS: 0.8120, UEM: 0.4145, LEM: 0.1751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4338, partial_loss/deprel_loss: 0.7239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7320, loss: 1.2735, batch_reg_loss: 0.0661, reg_loss: 0.0655 ||: 78%|#######7 | 74/95 [00:50<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6697, UAS: 0.8933, LAS: 0.8103, UEM: 0.4239, LEM: 0.1847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4333, partial_loss/deprel_loss: 2.4425, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7068, loss: 1.2919, batch_reg_loss: 0.0662, reg_loss: 0.0655 ||: 81%|########1 | 77/95 [00:52<00:12, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.8938, LAS: 0.8106, UEM: 0.4234, LEM: 0.1836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4158, partial_loss/deprel_loss: 0.7884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7801, loss: 1.2873, batch_reg_loss: 0.0662, reg_loss: 0.0656 ||: 84%|########4 | 80/95 [00:54<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8292, UAS: 0.8952, LAS: 0.8125, UEM: 0.4462, LEM: 0.2108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8022, partial_loss/deprel_loss: 1.0705, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0831, loss: 1.2711, batch_reg_loss: 0.0663, reg_loss: 0.0656 ||: 87%|########7 | 83/95 [00:57<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.8952, LAS: 0.8127, UEM: 0.4400, LEM: 0.2055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1483, partial_loss/deprel_loss: 1.3003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3363, loss: 1.2698, batch_reg_loss: 0.0663, reg_loss: 0.0656 ||: 92%|#########1| 87/95 [00:59<00:05, 
1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8966, LAS: 0.8144, UEM: 0.4516, LEM: 0.2121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4225, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 1.2534, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||: 95%|#########4| 90/95 [01:01<00:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.8979, LAS: 0.8161, UEM: 0.4584, LEM: 0.2137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6116, partial_loss/deprel_loss: 0.9072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9145, loss: 1.2385, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||: 98%|#########7| 93/95 [01:04<00:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.8987, LAS: 0.8170, UEM: 0.4618, LEM: 0.2129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4434, partial_loss/deprel_loss: 0.7938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 1.2303, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - reg_loss | 0.066 | N/A\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - UEM | 0.462 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer 
- LEM | 0.213 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - EM | 0.871 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.443 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - UAS | 0.899 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.794 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - loss | 1.230 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - LAS | 0.817 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:54,604 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:54,604 - INFO - combo.training.trainer - Epoch duration: 0:01:06.081709\n", + "2023-04-06 23:00:54,604 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:57\n", + "2023-04-06 23:00:54,604 - INFO - allennlp.training.trainer - Epoch 10/399\n", + "2023-04-06 23:00:54,605 - INFO - allennlp.training.trainer 
- Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:00:54,605 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:00:54,611 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7031, UAS: 0.8218, LAS: 0.7323, UEM: 0.0305, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5298, partial_loss/deprel_loss: 2.0268, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1939, loss: 1.9374, batch_reg_loss: 0.0665, reg_loss: 0.0665 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.8586, LAS: 0.7740, UEM: 0.3208, LEM: 0.1694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2965, partial_loss/deprel_loss: 1.2639, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3370, loss: 1.5704, batch_reg_loss: 0.0665, reg_loss: 0.0665 ||: 6%|6 | 6/95 [00:04<01:02, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.8798, LAS: 0.7985, UEM: 0.4239, LEM: 0.1836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0467, partial_loss/deprel_loss: 1.1728, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2142, loss: 1.3446, batch_reg_loss: 0.0666, reg_loss: 0.0665 ||: 9%|9 | 9/95 [00:06<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.8914, LAS: 0.8105, UEM: 0.4657, LEM: 0.2098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6000, partial_loss/deprel_loss: 0.8910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8994, loss: 1.2475, batch_reg_loss: 0.0666, reg_loss: 
0.0665 ||: 13%|#2 | 12/95 [00:09<01:02, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7631, UAS: 0.8833, LAS: 0.8005, UEM: 0.4205, LEM: 0.1888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6921, partial_loss/deprel_loss: 1.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7128, loss: 1.3505, batch_reg_loss: 0.0667, reg_loss: 0.0666 ||: 16%|#5 | 15/95 [00:11<00:59, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7271, UAS: 0.8819, LAS: 0.7994, UEM: 0.3897, LEM: 0.1691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5832, partial_loss/deprel_loss: 2.1145, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2749, loss: 1.3850, batch_reg_loss: 0.0667, reg_loss: 0.0666 ||: 19%|#8 | 18/95 [00:13<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8399, UAS: 0.8877, LAS: 0.8062, UEM: 0.4351, LEM: 0.2032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7033, partial_loss/deprel_loss: 0.9579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9737, loss: 1.3229, batch_reg_loss: 0.0668, reg_loss: 0.0666 ||: 22%|##2 | 21/95 [00:15<00:53, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8016, UAS: 0.8911, LAS: 0.8099, UEM: 0.4368, LEM: 0.2001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0288, partial_loss/deprel_loss: 1.3583, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3592, loss: 1.2861, batch_reg_loss: 0.0668, reg_loss: 0.0666 ||: 25%|##5 | 24/95 [00:17<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8398, UAS: 0.8934, LAS: 0.8121, UEM: 0.4386, LEM: 0.1962, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7464, partial_loss/deprel_loss: 1.0831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0827, loss: 1.2714, batch_reg_loss: 0.0669, reg_loss: 0.0667 ||: 28%|##8 | 27/95 [00:19<00:49, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.8953, LAS: 0.8150, UEM: 0.4853, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2152, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4406, loss: 1.2412, batch_reg_loss: 0.0669, reg_loss: 0.0667 ||: 32%|###1 | 30/95 [00:22<00:46, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8608, UAS: 0.8960, LAS: 0.8154, UEM: 0.4780, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5071, partial_loss/deprel_loss: 0.8553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8526, loss: 1.2423, batch_reg_loss: 0.0670, reg_loss: 0.0667 ||: 36%|###5 | 34/95 [00:25<00:44, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.8996, LAS: 0.8191, UEM: 0.4871, LEM: 0.2348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.7316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7375, loss: 1.2090, batch_reg_loss: 0.0670, reg_loss: 0.0667 ||: 40%|#### | 38/95 [00:27<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.8994, LAS: 0.8188, UEM: 0.4778, LEM: 0.2275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6680, partial_loss/deprel_loss: 0.9297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9444, loss: 1.2127, batch_reg_loss: 0.0671, reg_loss: 0.0668 ||: 43%|####3 | 41/95 [00:29<00:39, 
1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.8999, LAS: 0.8193, UEM: 0.4624, LEM: 0.2162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4983, partial_loss/deprel_loss: 1.5294, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5904, loss: 1.2083, batch_reg_loss: 0.0672, reg_loss: 0.0668 ||: 47%|####7 | 45/95 [00:32<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7780, UAS: 0.9007, LAS: 0.8201, UEM: 0.4617, LEM: 0.2117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4568, partial_loss/deprel_loss: 1.5623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6084, loss: 1.2016, batch_reg_loss: 0.0672, reg_loss: 0.0668 ||: 51%|##### | 48/95 [00:34<00:33, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7926, UAS: 0.9010, LAS: 0.8206, UEM: 0.4518, LEM: 0.2046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2942, partial_loss/deprel_loss: 1.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3907, loss: 1.1957, batch_reg_loss: 0.0673, reg_loss: 0.0669 ||: 55%|#####4 | 52/95 [00:37<00:29, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.8989, LAS: 0.8185, UEM: 0.4463, LEM: 0.2011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5744, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8179, loss: 1.2127, batch_reg_loss: 0.0673, reg_loss: 0.0669 ||: 59%|#####8 | 56/95 [00:39<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9001, LAS: 0.8200, UEM: 0.4409, LEM: 0.1938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7566, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0544, loss: 1.2014, batch_reg_loss: 0.0674, reg_loss: 0.0669 ||: 63%|######3 | 60/95 [00:41<00:22, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9013, LAS: 0.8216, UEM: 0.4710, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 0.7125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7222, loss: 1.1868, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||: 67%|######7 | 64/95 [00:45<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7727, UAS: 0.9012, LAS: 0.8212, UEM: 0.4776, LEM: 0.2361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4438, partial_loss/deprel_loss: 1.4439, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5114, loss: 1.1869, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||: 71%|####### | 67/95 [00:47<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8169, UAS: 0.9016, LAS: 0.8213, UEM: 0.4723, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8432, partial_loss/deprel_loss: 1.1341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1435, loss: 1.1835, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||: 74%|#######3 | 70/95 [00:49<00:17, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6733, UAS: 0.9001, LAS: 0.8197, UEM: 0.4714, LEM: 0.2294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2788, partial_loss/deprel_loss: 2.4155, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6558, loss: 1.2007, batch_reg_loss: 
0.0676, reg_loss: 0.0670 ||: 77%|#######6 | 73/95 [00:51<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8649, UAS: 0.9007, LAS: 0.8207, UEM: 0.4757, LEM: 0.2318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.8426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8417, loss: 1.1912, batch_reg_loss: 0.0676, reg_loss: 0.0671 ||: 80%|######## | 76/95 [00:54<00:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8503, UAS: 0.9007, LAS: 0.8207, UEM: 0.4681, LEM: 0.2252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7483, partial_loss/deprel_loss: 0.9126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9475, loss: 1.1914, batch_reg_loss: 0.0677, reg_loss: 0.0671 ||: 84%|########4 | 80/95 [00:56<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7666, UAS: 0.9010, LAS: 0.8212, UEM: 0.4685, LEM: 0.2241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8265, partial_loss/deprel_loss: 1.6867, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7824, loss: 1.1903, batch_reg_loss: 0.0678, reg_loss: 0.0671 ||: 88%|########8 | 84/95 [00:59<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9010, LAS: 0.8213, UEM: 0.4681, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7418, partial_loss/deprel_loss: 1.0076, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0223, loss: 1.1896, batch_reg_loss: 0.0678, reg_loss: 0.0671 ||: 92%|#########1| 87/95 [01:01<00:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8071, UAS: 0.9017, LAS: 0.8221, UEM: 
0.4660, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1855, partial_loss/deprel_loss: 1.3873, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4148, loss: 1.1838, batch_reg_loss: 0.0679, reg_loss: 0.0672 ||: 96%|#########5| 91/95 [01:04<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7212, UAS: 0.9013, LAS: 0.8217, UEM: 0.4694, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4279, partial_loss/deprel_loss: 1.9875, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1436, loss: 1.1866, batch_reg_loss: 0.0680, reg_loss: 0.0672 ||: 99%|#########8| 94/95 [01:06<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8137, UAS: 0.9012, LAS: 0.8216, UEM: 0.4672, LEM: 0.2210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0853, partial_loss/deprel_loss: 1.1440, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2002, loss: 1.1868, batch_reg_loss: 0.0680, reg_loss: 0.0672 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-06 23:02:01,360 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8164, UAS: 0.9162, LAS: 0.8416, UEM: 0.4038, LEM: 0.1126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5261, partial_loss/deprel_loss: 52.2277, partial_loss/cycle_loss: 0.0000, batch_loss: 42.0874, loss: 27.9840, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9343, LAS: 0.8675, UEM: 0.6663, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2763, partial_loss/deprel_loss: 18.2171, partial_loss/cycle_loss: 0.0000, batch_loss: 14.6289, loss: 23.2585, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9326, LAS: 0.8625, UEM: 0.5833, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9777, partial_loss/deprel_loss: 40.0335, partial_loss/cycle_loss: 0.0000, batch_loss: 32.2224, loss: 23.8342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9337, LAS: 0.8647, UEM: 0.6010, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2426, partial_loss/deprel_loss: 20.5975, partial_loss/cycle_loss: 0.0000, batch_loss: 16.5265, loss: 24.2762, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9363, LAS: 0.8680, UEM: 0.6106, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3556, partial_loss/deprel_loss: 25.5258, partial_loss/cycle_loss: 0.0000, batch_loss: 20.4918, loss: 23.9322, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.06it/s]\n", + "2023-04-06 23:02:11,763 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - reg_loss | 0.067 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UEM | 0.467 | 0.611\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - LEM | 0.221 | 0.321\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - EM | 0.814 | 0.901\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.085 | 0.356\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UAS | 0.901 | 0.936\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.144 | 25.526\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - loss | 1.187 | 23.932\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - LAS | 0.822 | 0.868\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.trainer - Epoch duration: 
0:01:17.160911\n", + "2023-04-06 23:02:11,765 - INFO - combo.training.trainer - Estimated training time remaining: 7:25:19\n", + "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - Epoch 11/399\n", + "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:02:11,773 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9371, LAS: 0.8700, UEM: 0.7673, LEM: 0.5902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0930, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3007, loss: 0.7984, batch_reg_loss: 0.0680, reg_loss: 0.0680 ||: 3%|3 | 3/95 [00:02<01:15, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8207, UAS: 0.9161, LAS: 0.8430, UEM: 0.6421, LEM: 0.4579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1003, partial_loss/deprel_loss: 1.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2884, loss: 1.0284, batch_reg_loss: 0.0681, reg_loss: 0.0680 ||: 6%|6 | 6/95 [00:04<01:10, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9152, LAS: 0.8389, UEM: 0.5687, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3384, partial_loss/deprel_loss: 0.6925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6898, loss: 1.0641, batch_reg_loss: 0.0681, reg_loss: 0.0681 ||: 11%|# | 10/95 [00:07<01:03, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7988, 
UAS: 0.9111, LAS: 0.8337, UEM: 0.5121, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3444, partial_loss/deprel_loss: 1.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4147, loss: 1.1073, batch_reg_loss: 0.0682, reg_loss: 0.0681 ||: 15%|#4 | 14/95 [00:09<00:56, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8031, UAS: 0.9140, LAS: 0.8370, UEM: 0.5409, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2805, partial_loss/deprel_loss: 1.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4183, loss: 1.0751, batch_reg_loss: 0.0683, reg_loss: 0.0681 ||: 18%|#7 | 17/95 [00:12<00:57, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9148, LAS: 0.8375, UEM: 0.5036, LEM: 0.2682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6595, partial_loss/deprel_loss: 0.9234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9390, loss: 1.0632, batch_reg_loss: 0.0683, reg_loss: 0.0682 ||: 22%|##2 | 21/95 [00:14<00:52, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7154, UAS: 0.9141, LAS: 0.8375, UEM: 0.5521, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7330, partial_loss/deprel_loss: 2.0155, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2274, loss: 1.0689, batch_reg_loss: 0.0684, reg_loss: 0.0682 ||: 25%|##5 | 24/95 [00:16<00:50, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9145, LAS: 0.8378, UEM: 0.5380, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6724, partial_loss/deprel_loss: 0.9636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9739, loss: 1.0667, 
batch_reg_loss: 0.0685, reg_loss: 0.0682 ||: 29%|##9 | 28/95 [00:19<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9145, LAS: 0.8375, UEM: 0.5314, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3632, partial_loss/deprel_loss: 0.6049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6251, loss: 1.0675, batch_reg_loss: 0.0685, reg_loss: 0.0683 ||: 33%|###2 | 31/95 [00:21<00:46, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9122, LAS: 0.8351, UEM: 0.5227, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4412, partial_loss/deprel_loss: 0.7872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 1.0905, batch_reg_loss: 0.0686, reg_loss: 0.0683 ||: 36%|###5 | 34/95 [00:23<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9136, LAS: 0.8364, UEM: 0.5206, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6975, partial_loss/deprel_loss: 0.9374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9580, loss: 1.0752, batch_reg_loss: 0.0686, reg_loss: 0.0683 ||: 39%|###8 | 37/95 [00:26<00:44, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8514, UAS: 0.9136, LAS: 0.8363, UEM: 0.5173, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6055, partial_loss/deprel_loss: 0.9506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9503, loss: 1.0753, batch_reg_loss: 0.0687, reg_loss: 0.0683 ||: 42%|####2 | 40/95 [00:28<00:40, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7790, UAS: 0.9144, LAS: 0.8375, UEM: 0.5324, 
LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4415, partial_loss/deprel_loss: 1.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4988, loss: 1.0630, batch_reg_loss: 0.0688, reg_loss: 0.0684 ||: 45%|####5 | 43/95 [00:30<00:39, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9137, LAS: 0.8369, UEM: 0.5255, LEM: 0.2673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.8005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8268, loss: 1.0684, batch_reg_loss: 0.0688, reg_loss: 0.0684 ||: 48%|####8 | 46/95 [00:33<00:36, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9121, LAS: 0.8351, UEM: 0.5167, LEM: 0.2606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3658, partial_loss/deprel_loss: 0.6982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7006, loss: 1.0860, batch_reg_loss: 0.0689, reg_loss: 0.0684 ||: 53%|#####2 | 50/95 [00:35<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.9100, LAS: 0.8325, UEM: 0.5021, LEM: 0.2508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9662, partial_loss/deprel_loss: 1.8036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9051, loss: 1.1094, batch_reg_loss: 0.0690, reg_loss: 0.0685 ||: 57%|#####6 | 54/95 [00:37<00:26, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9099, LAS: 0.8327, UEM: 0.5038, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9425, loss: 1.1041, batch_reg_loss: 0.0690, 
reg_loss: 0.0685 ||: 61%|######1 | 58/95 [00:40<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9098, LAS: 0.8327, UEM: 0.5115, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2085, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5077, loss: 1.1045, batch_reg_loss: 0.0691, reg_loss: 0.0685 ||: 65%|######5 | 62/95 [00:43<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.9075, LAS: 0.8304, UEM: 0.5118, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3136, partial_loss/deprel_loss: 1.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3928, loss: 1.1248, batch_reg_loss: 0.0692, reg_loss: 0.0686 ||: 68%|######8 | 65/95 [00:45<00:21, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9087, LAS: 0.8316, UEM: 0.5187, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3529, partial_loss/deprel_loss: 0.5969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 1.1125, batch_reg_loss: 0.0692, reg_loss: 0.0686 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9087, LAS: 0.8316, UEM: 0.5122, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3889, partial_loss/deprel_loss: 0.6496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6668, loss: 1.1118, batch_reg_loss: 0.0693, reg_loss: 0.0686 ||: 76%|#######5 | 72/95 [00:50<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9078, LAS: 0.8307, UEM: 0.4999, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0150, partial_loss/deprel_loss: 1.2229, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2507, loss: 1.1199, batch_reg_loss: 0.0694, reg_loss: 0.0687 ||: 80%|######## | 76/95 [00:52<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.9065, LAS: 0.8292, UEM: 0.4924, LEM: 0.2422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8164, partial_loss/deprel_loss: 1.5329, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6591, loss: 1.1326, batch_reg_loss: 0.0695, reg_loss: 0.0687 ||: 84%|########4 | 80/95 [00:54<00:09, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9077, LAS: 0.8305, UEM: 0.5010, LEM: 0.2464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7163, loss: 1.1202, batch_reg_loss: 0.0695, reg_loss: 0.0687 ||: 88%|########8 | 84/95 [00:57<00:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8075, UAS: 0.9064, LAS: 0.8288, UEM: 0.4941, LEM: 0.2412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0405, partial_loss/deprel_loss: 1.2673, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2915, loss: 1.1359, batch_reg_loss: 0.0696, reg_loss: 0.0688 ||: 93%|#########2| 88/95 [01:00<00:04, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8281, UAS: 0.9071, LAS: 0.8296, UEM: 0.4892, LEM: 0.2361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8237, partial_loss/deprel_loss: 1.0912, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.1074, loss: 1.1295, batch_reg_loss: 0.0697, reg_loss: 0.0688 ||: 97%|#########6| 92/95 [01:02<00:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7914, UAS: 0.9071, LAS: 0.8296, UEM: 0.4845, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3436, partial_loss/deprel_loss: 1.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4480, loss: 1.1300, batch_reg_loss: 0.0697, reg_loss: 0.0688 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer - reg_loss | 0.069 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UEM | 0.484 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LEM | 0.232 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EM | 0.791 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.344 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UAS | 0.907 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - 
partial_loss/deprel_loss | 1.387 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - loss | 1.130 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LAS | 0.830 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:03:16,352 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:16,352 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:16,352 - INFO - combo.training.trainer - Epoch duration: 0:01:04.586566\n", + "2023-04-06 23:03:16,352 - INFO - combo.training.trainer - Estimated training time remaining: 7:21:58\n", + "2023-04-06 23:03:16,352 - INFO - allennlp.training.trainer - Epoch 12/399\n", + "2023-04-06 23:03:16,352 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:03:16,353 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:03:16,359 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9142, LAS: 0.8380, UEM: 0.5825, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8646, partial_loss/deprel_loss: 1.2057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2073, loss: 1.0739, batch_reg_loss: 0.0698, reg_loss: 0.0698 ||: 3%|3 | 3/95 [00:02<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9034, LAS: 0.8276, UEM: 0.6364, LEM: 0.4222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1870, partial_loss/deprel_loss: 0.4088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 1.1700, batch_reg_loss: 0.0698, reg_loss: 0.0698 ||: 6%|6 | 6/95 [00:04<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9081, LAS: 0.8352, UEM: 0.7177, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5395, partial_loss/deprel_loss: 1.5154, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5901, loss: 1.1147, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||: 8%|8 | 8/95 [00:08<01:36, 1.10s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9166, LAS: 0.8453, UEM: 0.6879, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.6113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6359, loss: 1.0103, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||: 12%|#1 | 11/95 [00:10<01:24, 1.01s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9076, LAS: 0.8340, UEM: 0.6387, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7420, partial_loss/deprel_loss: 1.0690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0736, loss: 1.1095, batch_reg_loss: 0.0700, reg_loss: 0.0699 ||: 15%|#4 | 14/95 [00:13<01:15, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8029, UAS: 0.9005, LAS: 0.8259, UEM: 0.5868, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3702, partial_loss/deprel_loss: 1.3301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4082, loss: 1.1735, batch_reg_loss: 0.0701, reg_loss: 0.0699 ||: 19%|#8 | 18/95 [00:15<01:04, 1.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9052, LAS: 0.8306, UEM: 0.5698, LEM: 0.3542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4813, partial_loss/deprel_loss: 0.7393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7578, loss: 1.1321, batch_reg_loss: 0.0701, reg_loss: 0.0699 ||: 22%|##2 | 21/95 [00:17<01:00, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8127, UAS: 0.9013, LAS: 0.8258, UEM: 0.5385, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1662, partial_loss/deprel_loss: 1.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3917, loss: 1.1798, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||: 25%|##5 | 24/95 [00:19<00:54, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9033, LAS: 0.8286, UEM: 0.5236, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6162, partial_loss/deprel_loss: 0.7490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7927, loss: 1.1548, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||: 28%|##8 | 27/95 [00:21<00:51, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8474, UAS: 0.9078, LAS: 0.8336, UEM: 0.5471, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6983, partial_loss/deprel_loss: 1.0023, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0118, loss: 1.1121, batch_reg_loss: 0.0703, reg_loss: 0.0700 ||: 32%|###1 | 30/95 [00:24<00:48, 1.33it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7711, UAS: 0.9058, LAS: 0.8310, UEM: 0.5267, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7300, partial_loss/deprel_loss: 1.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6616, loss: 1.1349, batch_reg_loss: 0.0704, reg_loss: 0.0700 ||: 35%|###4 | 33/95 [00:26<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8769, UAS: 0.9046, LAS: 0.8294, UEM: 0.5203, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.6940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 1.1464, batch_reg_loss: 0.0704, reg_loss: 0.0701 ||: 38%|###7 | 36/95 [00:28<00:45, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9070, LAS: 0.8316, UEM: 0.5123, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8512, partial_loss/deprel_loss: 1.1832, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1873, loss: 1.1284, batch_reg_loss: 0.0705, reg_loss: 0.0701 ||: 42%|####2 | 40/95 [00:31<00:38, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9052, LAS: 0.8290, UEM: 0.4983, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4265, partial_loss/deprel_loss: 0.8326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8220, loss: 1.1563, batch_reg_loss: 0.0706, reg_loss: 0.0702 ||: 46%|####6 | 44/95 [00:33<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8177, UAS: 0.9056, LAS: 0.8295, UEM: 0.4901, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9502, 
partial_loss/deprel_loss: 1.1176, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1547, loss: 1.1493, batch_reg_loss: 0.0707, reg_loss: 0.0702 ||: 49%|####9 | 47/95 [00:35<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9061, LAS: 0.8299, UEM: 0.4935, LEM: 0.2593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5518, partial_loss/deprel_loss: 0.8065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8263, loss: 1.1427, batch_reg_loss: 0.0707, reg_loss: 0.0702 ||: 53%|#####2 | 50/95 [00:38<00:32, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9074, LAS: 0.8313, UEM: 0.4914, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5048, partial_loss/deprel_loss: 0.7113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7408, loss: 1.1276, batch_reg_loss: 0.0708, reg_loss: 0.0703 ||: 56%|#####5 | 53/95 [00:40<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9088, LAS: 0.8330, UEM: 0.4917, LEM: 0.2485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5163, partial_loss/deprel_loss: 0.7191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7494, loss: 1.1115, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||: 59%|#####8 | 56/95 [00:42<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7491, UAS: 0.9080, LAS: 0.8324, UEM: 0.4943, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1553, partial_loss/deprel_loss: 1.5914, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7751, loss: 1.1141, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||: 62%|######2 | 59/95 [00:44<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9075, LAS: 0.8318, UEM: 0.4819, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6134, partial_loss/deprel_loss: 0.8982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9122, loss: 1.1176, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||: 66%|######6 | 63/95 [00:46<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9076, LAS: 0.8317, UEM: 0.4790, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0133, partial_loss/deprel_loss: 1.2214, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2509, loss: 1.1179, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||: 69%|######9 | 66/95 [00:49<00:20, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9067, LAS: 0.8308, UEM: 0.4723, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.8242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8391, loss: 1.1274, batch_reg_loss: 0.0711, reg_loss: 0.0704 ||: 73%|#######2 | 69/95 [00:51<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8457, UAS: 0.9068, LAS: 0.8308, UEM: 0.4759, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7431, partial_loss/deprel_loss: 0.9755, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0002, loss: 1.1290, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||: 77%|#######6 | 73/95 [00:54<00:15, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9068, LAS: 0.8307, UEM: 0.4711, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0499, partial_loss/deprel_loss: 1.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2433, loss: 1.1291, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||: 80%|######## | 76/95 [00:56<00:13, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9062, LAS: 0.8303, UEM: 0.4706, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4272, partial_loss/deprel_loss: 0.7090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7240, loss: 1.1358, batch_reg_loss: 0.0713, reg_loss: 0.0705 ||: 84%|########4 | 80/95 [00:58<00:10, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9063, LAS: 0.8304, UEM: 0.4649, LEM: 0.2238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 1.0563, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0663, loss: 1.1354, batch_reg_loss: 0.0714, reg_loss: 0.0706 ||: 88%|########8 | 84/95 [01:01<00:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9080, LAS: 0.8324, UEM: 0.4830, LEM: 0.2363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3591, partial_loss/deprel_loss: 0.6660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 1.1192, batch_reg_loss: 0.0715, reg_loss: 0.0706 ||: 93%|#########2| 88/95 [01:03<00:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9089, LAS: 0.8334, UEM: 0.4855, LEM: 0.2353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3223, partial_loss/deprel_loss: 0.6439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6511, loss: 1.1072, batch_reg_loss: 0.0716, reg_loss: 0.0706 ||: 
97%|#########6| 92/95 [01:06<00:01, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9097, LAS: 0.8345, UEM: 0.4884, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6029, partial_loss/deprel_loss: 0.8348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8601, loss: 1.0974, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||: 100%|##########| 95/95 [01:08<00:00, 1.40it/s]\n", + "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer - reg_loss | 0.071 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UEM | 0.488 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LEM | 0.235 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EM | 0.863 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.603 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UAS | 0.910 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.835 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - loss | 1.097 | 
N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LAS | 0.835 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:04:24,429 - INFO - combo.training.trainer - Epoch duration: 0:01:08.076904\n", + "2023-04-06 23:04:24,429 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:41\n", + "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - Epoch 13/399\n", + "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:04:24,436 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8559, UAS: 0.9381, LAS: 0.8680, UEM: 0.6473, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8799, loss: 0.7820, batch_reg_loss: 0.0717, reg_loss: 0.0717 ||: 4%|4 | 4/95 [00:02<00:55, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.9090, LAS: 0.8358, UEM: 0.5967, LEM: 0.3128, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3901, partial_loss/deprel_loss: 1.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4911, loss: 1.0766, batch_reg_loss: 0.0718, reg_loss: 0.0717 ||: 7%|7 | 7/95 [00:04<00:56, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9142, LAS: 0.8405, UEM: 0.5602, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3589, partial_loss/deprel_loss: 0.5954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6199, loss: 1.0375, batch_reg_loss: 0.0718, reg_loss: 0.0717 ||: 12%|#1 | 11/95 [00:07<00:53, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9187, LAS: 0.8454, UEM: 0.5227, LEM: 0.2421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8380, partial_loss/deprel_loss: 1.0987, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1185, loss: 1.0070, batch_reg_loss: 0.0719, reg_loss: 0.0718 ||: 16%|#5 | 15/95 [00:09<00:49, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9218, LAS: 0.8490, UEM: 0.5440, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2444, partial_loss/deprel_loss: 0.5095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.9723, batch_reg_loss: 0.0720, reg_loss: 0.0718 ||: 20%|## | 19/95 [00:11<00:47, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9254, LAS: 0.8535, UEM: 0.5707, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4998, partial_loss/deprel_loss: 0.7194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7475, loss: 0.9289, batch_reg_loss: 0.0720, reg_loss: 0.0718 ||: 23%|##3 | 22/95 [00:14<00:47, 
1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9244, LAS: 0.8525, UEM: 0.5700, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7205, partial_loss/deprel_loss: 0.9875, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0062, loss: 0.9452, batch_reg_loss: 0.0721, reg_loss: 0.0719 ||: 26%|##6 | 25/95 [00:16<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9257, LAS: 0.8542, UEM: 0.5648, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.6602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6798, loss: 0.9305, batch_reg_loss: 0.0721, reg_loss: 0.0719 ||: 29%|##9 | 28/95 [00:18<00:45, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9247, LAS: 0.8526, UEM: 0.5489, LEM: 0.2609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6482, partial_loss/deprel_loss: 0.8613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8909, loss: 0.9451, batch_reg_loss: 0.0722, reg_loss: 0.0719 ||: 34%|###3 | 32/95 [00:20<00:42, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9219, LAS: 0.8491, UEM: 0.5345, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5332, partial_loss/deprel_loss: 0.8294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8425, loss: 0.9753, batch_reg_loss: 0.0723, reg_loss: 0.0720 ||: 37%|###6 | 35/95 [00:23<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8058, UAS: 0.9230, LAS: 0.8511, UEM: 0.5672, LEM: 
0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1614, partial_loss/deprel_loss: 1.1866, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2539, loss: 0.9600, batch_reg_loss: 0.0723, reg_loss: 0.0720 ||: 40%|#### | 38/95 [00:25<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7790, UAS: 0.9219, LAS: 0.8504, UEM: 0.5568, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5085, partial_loss/deprel_loss: 1.4547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5378, loss: 0.9640, batch_reg_loss: 0.0724, reg_loss: 0.0720 ||: 44%|####4 | 42/95 [00:28<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9209, LAS: 0.8496, UEM: 0.5509, LEM: 0.2868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4107, partial_loss/deprel_loss: 0.6130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.9750, batch_reg_loss: 0.0725, reg_loss: 0.0721 ||: 47%|####7 | 45/95 [00:30<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9199, LAS: 0.8483, UEM: 0.5340, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.9725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9852, loss: 0.9868, batch_reg_loss: 0.0725, reg_loss: 0.0721 ||: 52%|#####1 | 49/95 [00:32<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9180, LAS: 0.8463, UEM: 0.5306, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.6815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6944, loss: 1.0060, batch_reg_loss: 0.0726, reg_loss: 
0.0721 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8418, UAS: 0.9184, LAS: 0.8466, UEM: 0.5256, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7632, partial_loss/deprel_loss: 0.9772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 1.0007, batch_reg_loss: 0.0727, reg_loss: 0.0722 ||: 59%|#####8 | 56/95 [00:37<00:26, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7729, UAS: 0.9164, LAS: 0.8441, UEM: 0.5115, LEM: 0.2566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5636, partial_loss/deprel_loss: 1.4738, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5645, loss: 1.0198, batch_reg_loss: 0.0728, reg_loss: 0.0722 ||: 63%|######3 | 60/95 [00:39<00:22, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7463, UAS: 0.9147, LAS: 0.8422, UEM: 0.5032, LEM: 0.2503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0702, partial_loss/deprel_loss: 1.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8317, loss: 1.0350, batch_reg_loss: 0.0729, reg_loss: 0.0722 ||: 67%|######7 | 64/95 [00:42<00:19, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9151, LAS: 0.8426, UEM: 0.5026, LEM: 0.2482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.8218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8573, loss: 1.0305, batch_reg_loss: 0.0730, reg_loss: 0.0723 ||: 72%|#######1 | 68/95 [00:45<00:18, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7964, UAS: 0.9153, LAS: 0.8428, UEM: 0.5113, LEM: 0.2611, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4143, partial_loss/deprel_loss: 1.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4779, loss: 1.0303, batch_reg_loss: 0.0730, reg_loss: 0.0723 ||: 75%|#######4 | 71/95 [00:48<00:18, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9132, LAS: 0.8403, UEM: 0.5022, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6510, partial_loss/deprel_loss: 1.4862, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5923, loss: 1.0526, batch_reg_loss: 0.0731, reg_loss: 0.0723 ||: 79%|#######8 | 75/95 [00:50<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9131, LAS: 0.8403, UEM: 0.4988, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8652, partial_loss/deprel_loss: 0.9862, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0352, loss: 1.0537, batch_reg_loss: 0.0732, reg_loss: 0.0724 ||: 83%|########3 | 79/95 [00:53<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9131, LAS: 0.8402, UEM: 0.4962, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4240, partial_loss/deprel_loss: 0.7195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7337, loss: 1.0538, batch_reg_loss: 0.0733, reg_loss: 0.0724 ||: 86%|########6 | 82/95 [00:55<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9123, LAS: 0.8394, UEM: 0.4930, LEM: 0.2456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4785, partial_loss/deprel_loss: 0.7711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7859, loss: 1.0607, batch_reg_loss: 0.0733, reg_loss: 
0.0725 ||: 89%|########9 | 85/95 [00:57<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9126, LAS: 0.8397, UEM: 0.5022, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4379, partial_loss/deprel_loss: 0.8143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8124, loss: 1.0589, batch_reg_loss: 0.0734, reg_loss: 0.0725 ||: 93%|#########2| 88/95 [00:59<00:05, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9123, LAS: 0.8392, UEM: 0.4962, LEM: 0.2488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3830, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6806, loss: 1.0621, batch_reg_loss: 0.0735, reg_loss: 0.0725 ||: 97%|#########6| 92/95 [01:02<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9117, LAS: 0.8385, UEM: 0.4926, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5572, partial_loss/deprel_loss: 0.7749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8049, loss: 1.0700, batch_reg_loss: 0.0735, reg_loss: 0.0726 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - reg_loss | 0.073 | N/A\n", + "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - 
combo.training.tensorboard_writer - UEM | 0.493 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LEM | 0.245 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - EM | 0.876 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.557 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - UAS | 0.912 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.775 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - loss | 1.070 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LAS | 0.838 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.907 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:28,664 - INFO - combo.training.trainer - Epoch duration: 0:01:04.234400\n", + "2023-04-06 23:05:28,664 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:40\n", + "2023-04-06 
23:05:28,664 - INFO - allennlp.training.trainer - Epoch 14/399\n", + "2023-04-06 23:05:28,664 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:05:28,665 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:05:28,670 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8995, LAS: 0.8276, UEM: 0.4028, LEM: 0.1517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.7889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8084, loss: 1.1586, batch_reg_loss: 0.0736, reg_loss: 0.0736 ||: 3%|3 | 3/95 [00:02<01:07, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8122, UAS: 0.9089, LAS: 0.8349, UEM: 0.4075, LEM: 0.1567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2148, partial_loss/deprel_loss: 1.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3207, loss: 1.0912, batch_reg_loss: 0.0737, reg_loss: 0.0736 ||: 6%|6 | 6/95 [00:04<01:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9115, LAS: 0.8384, UEM: 0.3569, LEM: 0.1226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0056, partial_loss/deprel_loss: 1.0178, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0892, loss: 1.0504, batch_reg_loss: 0.0738, reg_loss: 0.0737 ||: 11%|# | 10/95 [00:06<00:58, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9078, LAS: 0.8351, UEM: 0.4315, LEM: 0.1907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5430, loss: 1.0827, batch_reg_loss: 0.0738, reg_loss: 0.0737 ||: 14%|#3 | 13/95 [00:08<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9063, LAS: 0.8329, UEM: 0.4217, LEM: 0.1819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4802, partial_loss/deprel_loss: 0.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7768, loss: 1.1004, batch_reg_loss: 0.0739, reg_loss: 0.0737 ||: 18%|#7 | 17/95 [00:11<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7983, UAS: 0.9064, LAS: 0.8333, UEM: 0.4143, LEM: 0.1745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4510, partial_loss/deprel_loss: 1.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5131, loss: 1.1014, batch_reg_loss: 0.0740, reg_loss: 0.0738 ||: 21%|##1 | 20/95 [00:13<00:51, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9072, LAS: 0.8341, UEM: 0.4074, LEM: 0.1658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9802, partial_loss/deprel_loss: 1.0603, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1183, loss: 1.0997, batch_reg_loss: 0.0741, reg_loss: 0.0738 ||: 25%|##5 | 24/95 [00:15<00:46, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7769, UAS: 0.9086, LAS: 0.8357, UEM: 0.4271, LEM: 0.1792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6805, partial_loss/deprel_loss: 1.4625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5803, loss: 1.0884, batch_reg_loss: 0.0742, reg_loss: 0.0739 ||: 29%|##9 | 28/95 [00:18<00:42, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8238, UAS: 0.9128, 
LAS: 0.8405, UEM: 0.4980, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2294, partial_loss/deprel_loss: 1.1924, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2740, loss: 1.0447, batch_reg_loss: 0.0742, reg_loss: 0.0739 ||: 34%|###3 | 32/95 [00:21<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9143, LAS: 0.8424, UEM: 0.4999, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4578, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 1.0288, batch_reg_loss: 0.0743, reg_loss: 0.0739 ||: 37%|###6 | 35/95 [00:23<00:41, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9161, LAS: 0.8445, UEM: 0.5030, LEM: 0.2381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6349, loss: 1.0128, batch_reg_loss: 0.0744, reg_loss: 0.0740 ||: 40%|#### | 38/95 [00:25<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9150, LAS: 0.8434, UEM: 0.4975, LEM: 0.2359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4017, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 1.0182, batch_reg_loss: 0.0744, reg_loss: 0.0740 ||: 44%|####4 | 42/95 [00:28<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7646, UAS: 0.9144, LAS: 0.8432, UEM: 0.5281, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9945, partial_loss/deprel_loss: 1.5558, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.7180, loss: 1.0241, batch_reg_loss: 0.0745, reg_loss: 0.0740 ||: 47%|####7 | 45/95 [00:31<00:36, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9145, LAS: 0.8433, UEM: 0.5175, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.7959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7951, loss: 1.0231, batch_reg_loss: 0.0746, reg_loss: 0.0741 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9136, LAS: 0.8421, UEM: 0.5076, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7028, partial_loss/deprel_loss: 0.8929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9295, loss: 1.0349, batch_reg_loss: 0.0746, reg_loss: 0.0741 ||: 55%|#####4 | 52/95 [00:35<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9155, LAS: 0.8441, UEM: 0.5193, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3191, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6256, loss: 1.0190, batch_reg_loss: 0.0747, reg_loss: 0.0741 ||: 58%|#####7 | 55/95 [00:37<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.9151, LAS: 0.8434, UEM: 0.5131, LEM: 0.2629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8426, partial_loss/deprel_loss: 1.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2183, loss: 1.0272, batch_reg_loss: 0.0748, reg_loss: 0.0742 ||: 62%|######2 | 59/95 [00:40<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9160, LAS: 0.8443, UEM: 0.5126, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7857, partial_loss/deprel_loss: 1.0030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0343, loss: 1.0196, batch_reg_loss: 0.0748, reg_loss: 0.0742 ||: 65%|######5 | 62/95 [00:42<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9158, LAS: 0.8441, UEM: 0.5048, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8111, partial_loss/deprel_loss: 0.9532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9997, loss: 1.0238, batch_reg_loss: 0.0749, reg_loss: 0.0743 ||: 69%|######9 | 66/95 [00:44<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8682, UAS: 0.9161, LAS: 0.8444, UEM: 0.5025, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6108, partial_loss/deprel_loss: 0.7552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8013, loss: 1.0215, batch_reg_loss: 0.0750, reg_loss: 0.0743 ||: 74%|#######3 | 70/95 [00:47<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9148, LAS: 0.8428, UEM: 0.5010, LEM: 0.2483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3281, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 1.0366, batch_reg_loss: 0.0751, reg_loss: 0.0743 ||: 78%|#######7 | 74/95 [00:49<00:13, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9138, LAS: 0.8419, UEM: 0.4946, LEM: 0.2443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7095, partial_loss/deprel_loss: 0.9343, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.9645, loss: 1.0429, batch_reg_loss: 0.0752, reg_loss: 0.0744 ||: 82%|########2 | 78/95 [00:52<00:11, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.9139, LAS: 0.8420, UEM: 0.4931, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8576, partial_loss/deprel_loss: 1.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6679, loss: 1.0455, batch_reg_loss: 0.0753, reg_loss: 0.0744 ||: 86%|########6 | 82/95 [00:55<00:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9141, LAS: 0.8424, UEM: 0.5003, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0369, partial_loss/deprel_loss: 1.2106, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2512, loss: 1.0436, batch_reg_loss: 0.0754, reg_loss: 0.0745 ||: 91%|######### | 86/95 [00:58<00:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9140, LAS: 0.8425, UEM: 0.5041, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3531, partial_loss/deprel_loss: 0.5890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 1.0458, batch_reg_loss: 0.0754, reg_loss: 0.0745 ||: 94%|#########3| 89/95 [01:00<00:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.9140, LAS: 0.8425, UEM: 0.4988, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9683, partial_loss/deprel_loss: 1.0885, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1400, loss: 1.0450, batch_reg_loss: 0.0755, reg_loss: 0.0745 ||: 98%|#########7| 93/95 [01:03<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9147, LAS: 0.8433, UEM: 0.5042, LEM: 0.2521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3336, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6039, loss: 1.0379, batch_reg_loss: 0.0756, reg_loss: 0.0746 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - reg_loss | 0.075 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UEM | 0.504 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - LEM | 0.252 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EM | 0.887 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.334 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UAS | 0.915 | N/A\n", + "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.577 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - loss | 1.038 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - LAS | 0.843 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:06:33,741 - INFO - combo.training.trainer - Epoch duration: 0:01:05.076501\n", + "2023-04-06 23:06:33,741 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:16\n", + "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - Epoch 15/399\n", + "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:06:33,748 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9288, LAS: 0.8590, UEM: 0.4644, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3342, partial_loss/deprel_loss: 0.5915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6157, loss: 0.9118, batch_reg_loss: 0.0756, reg_loss: 0.0756 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9227, LAS: 0.8551, UEM: 0.4754, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.4619, partial_loss/deprel_loss: 0.7155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.9390, batch_reg_loss: 0.0757, reg_loss: 0.0756 ||: 6%|6 | 6/95 [00:04<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9234, LAS: 0.8552, UEM: 0.5529, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4761, partial_loss/deprel_loss: 0.7624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7809, loss: 0.9247, batch_reg_loss: 0.0758, reg_loss: 0.0757 ||: 9%|9 | 9/95 [00:06<01:01, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9260, LAS: 0.8572, UEM: 0.5653, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3541, partial_loss/deprel_loss: 0.6327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6528, loss: 0.9133, batch_reg_loss: 0.0758, reg_loss: 0.0757 ||: 13%|#2 | 12/95 [00:08<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9186, LAS: 0.8482, UEM: 0.5590, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3758, partial_loss/deprel_loss: 0.6077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6373, loss: 0.9877, batch_reg_loss: 0.0759, reg_loss: 0.0757 ||: 17%|#6 | 16/95 [00:11<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9244, LAS: 0.8549, UEM: 0.5798, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.7005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7176, loss: 0.9355, batch_reg_loss: 0.0760, reg_loss: 0.0758 ||: 21%|##1 | 20/95 [00:13<00:50, 1.50it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8450, UAS: 0.9241, LAS: 0.8542, UEM: 0.5484, LEM: 0.2661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7622, partial_loss/deprel_loss: 0.9469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9861, loss: 0.9463, batch_reg_loss: 0.0761, reg_loss: 0.0758 ||: 25%|##5 | 24/95 [00:15<00:45, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9218, LAS: 0.8524, UEM: 0.5621, LEM: 0.2783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5259, loss: 0.9628, batch_reg_loss: 0.0762, reg_loss: 0.0759 ||: 29%|##9 | 28/95 [00:18<00:43, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7785, UAS: 0.9227, LAS: 0.8543, UEM: 0.6101, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9559, partial_loss/deprel_loss: 1.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6691, loss: 0.9506, batch_reg_loss: 0.0762, reg_loss: 0.0759 ||: 33%|###2 | 31/95 [00:21<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9232, LAS: 0.8549, UEM: 0.6136, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.4036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4337, loss: 0.9453, batch_reg_loss: 0.0763, reg_loss: 0.0759 ||: 36%|###5 | 34/95 [00:23<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8518, UAS: 0.9206, LAS: 0.8518, UEM: 0.5920, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6710, 
partial_loss/deprel_loss: 0.8887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9216, loss: 0.9707, batch_reg_loss: 0.0764, reg_loss: 0.0760 ||: 40%|#### | 38/95 [00:25<00:37, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8388, UAS: 0.9188, LAS: 0.8498, UEM: 0.5726, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9090, partial_loss/deprel_loss: 1.0273, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0801, loss: 0.9862, batch_reg_loss: 0.0765, reg_loss: 0.0760 ||: 44%|####4 | 42/95 [00:28<00:35, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9197, LAS: 0.8510, UEM: 0.5769, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3747, partial_loss/deprel_loss: 0.6371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.9721, batch_reg_loss: 0.0765, reg_loss: 0.0761 ||: 47%|####7 | 45/95 [00:30<00:35, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7993, UAS: 0.9199, LAS: 0.8513, UEM: 0.5792, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4818, partial_loss/deprel_loss: 1.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4545, loss: 0.9709, batch_reg_loss: 0.0766, reg_loss: 0.0761 ||: 51%|##### | 48/95 [00:32<00:34, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.9192, LAS: 0.8503, UEM: 0.5732, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2909, partial_loss/deprel_loss: 1.3614, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4240, loss: 0.9733, batch_reg_loss: 0.0767, reg_loss: 0.0761 ||: 54%|#####3 | 51/95 [00:35<00:32, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8298, UAS: 0.9190, LAS: 0.8499, UEM: 0.5627, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9471, partial_loss/deprel_loss: 1.1233, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1648, loss: 0.9763, batch_reg_loss: 0.0768, reg_loss: 0.0762 ||: 57%|#####6 | 54/95 [00:37<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7755, UAS: 0.9179, LAS: 0.8488, UEM: 0.5505, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8752, partial_loss/deprel_loss: 1.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6692, loss: 0.9884, batch_reg_loss: 0.0768, reg_loss: 0.0762 ||: 61%|######1 | 58/95 [00:40<00:26, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9177, LAS: 0.8488, UEM: 0.5661, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1684, partial_loss/deprel_loss: 0.3627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.9884, batch_reg_loss: 0.0769, reg_loss: 0.0762 ||: 64%|######4 | 61/95 [00:42<00:25, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9166, LAS: 0.8477, UEM: 0.5528, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5622, partial_loss/deprel_loss: 0.8644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.9998, batch_reg_loss: 0.0770, reg_loss: 0.0763 ||: 68%|######8 | 65/95 [00:44<00:20, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9160, LAS: 0.8466, UEM: 0.5391, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9552, partial_loss/deprel_loss: 1.0026, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0702, loss: 1.0081, batch_reg_loss: 0.0771, reg_loss: 0.0763 ||: 73%|#######2 | 69/95 [00:46<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9163, LAS: 0.8468, UEM: 0.5345, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7857, partial_loss/deprel_loss: 0.9780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 1.0061, batch_reg_loss: 0.0772, reg_loss: 0.0764 ||: 77%|#######6 | 73/95 [00:49<00:13, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9161, LAS: 0.8465, UEM: 0.5242, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8016, partial_loss/deprel_loss: 0.9685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0124, loss: 1.0086, batch_reg_loss: 0.0773, reg_loss: 0.0764 ||: 81%|########1 | 77/95 [00:51<00:10, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8215, UAS: 0.9153, LAS: 0.8454, UEM: 0.5156, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9789, partial_loss/deprel_loss: 1.2141, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2444, loss: 1.0181, batch_reg_loss: 0.0774, reg_loss: 0.0765 ||: 85%|########5 | 81/95 [00:54<00:08, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9155, LAS: 0.8456, UEM: 0.5128, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3639, partial_loss/deprel_loss: 0.6349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 1.0161, batch_reg_loss: 0.0775, reg_loss: 0.0765 ||: 89%|########9 | 85/95 
[00:56<00:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9155, LAS: 0.8454, UEM: 0.5119, LEM: 0.2650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.7593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7775, loss: 1.0191, batch_reg_loss: 0.0775, reg_loss: 0.0766 ||: 94%|#########3| 89/95 [01:00<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9154, LAS: 0.8452, UEM: 0.5062, LEM: 0.2609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8630, partial_loss/deprel_loss: 1.0097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0580, loss: 1.0202, batch_reg_loss: 0.0776, reg_loss: 0.0766 ||: 97%|#########6| 92/95 [01:02<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9157, LAS: 0.8456, UEM: 0.5057, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 1.0813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0948, loss: 1.0184, batch_reg_loss: 0.0777, reg_loss: 0.0766 ||: 100%|##########| 95/95 [01:04<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9157, LAS: 0.8456, UEM: 0.5057, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 1.0813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0948, loss: 1.0184, batch_reg_loss: 0.0777, reg_loss: 0.0766 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-06 23:07:38,192 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9231, LAS: 0.8549, UEM: 0.2597, LEM: 0.0747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8460, partial_loss/deprel_loss: 41.4560, partial_loss/cycle_loss: 0.0000, batch_loss: 33.3340, loss: 30.5996, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9399, LAS: 0.8781, UEM: 0.6512, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 18.9218, partial_loss/cycle_loss: 0.0000, batch_loss: 15.1820, loss: 25.0834, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:05, 1.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9336, LAS: 0.8698, UEM: 0.5862, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7833, partial_loss/deprel_loss: 31.7641, partial_loss/cycle_loss: 0.0000, batch_loss: 25.5679, loss: 27.7894, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9401, LAS: 0.8766, UEM: 0.6039, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5219, partial_loss/deprel_loss: 22.8067, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3497, loss: 25.6024, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9428, LAS: 0.8808, UEM: 0.6373, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2147, partial_loss/deprel_loss: 21.5416, 
partial_loss/cycle_loss: 0.0000, batch_loss: 17.2762, loss: 24.8455, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01it/s]\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - reg_loss | 0.077 | 0.000\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - UEM | 0.506 | 0.637\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - LEM | 0.260 | 0.358\n", + "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EM | 0.840 | 0.923\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.761 | 0.215\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - UAS | 0.916 | 0.943\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.081 | 21.542\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - loss | 1.018 | 24.845\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - LAS | 0.846 | 0.881\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | 
N/A\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:07:49,045 - INFO - combo.training.trainer - Epoch duration: 0:01:15.303924\n", + "2023-04-06 23:07:49,045 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:08\n", + "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - Epoch 16/399\n", + "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:07:49,051 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9318, LAS: 0.8614, UEM: 0.4894, LEM: 0.1965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4096, partial_loss/deprel_loss: 0.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6683, loss: 0.8488, batch_reg_loss: 0.0777, reg_loss: 0.0777 ||: 3%|3 | 3/95 [00:02<01:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9351, LAS: 0.8664, UEM: 0.5156, LEM: 0.2211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3136, partial_loss/deprel_loss: 0.5873, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6103, loss: 0.8393, batch_reg_loss: 0.0778, reg_loss: 0.0777 ||: 
6%|6 | 6/95 [00:04<01:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8190, UAS: 0.9224, LAS: 0.8541, UEM: 0.4664, LEM: 0.2007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2185, partial_loss/deprel_loss: 1.1788, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2646, loss: 0.9456, batch_reg_loss: 0.0779, reg_loss: 0.0778 ||: 9%|9 | 9/95 [00:06<01:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7607, UAS: 0.9187, LAS: 0.8505, UEM: 0.4539, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8743, partial_loss/deprel_loss: 1.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7006, loss: 0.9853, batch_reg_loss: 0.0779, reg_loss: 0.0778 ||: 14%|#3 | 13/95 [00:08<00:56, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9187, LAS: 0.8500, UEM: 0.4268, LEM: 0.1787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6203, partial_loss/deprel_loss: 0.8485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.9889, batch_reg_loss: 0.0780, reg_loss: 0.0779 ||: 18%|#7 | 17/95 [00:11<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9209, LAS: 0.8532, UEM: 0.5132, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0836, partial_loss/deprel_loss: 0.2480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2932, loss: 0.9624, batch_reg_loss: 0.0781, reg_loss: 0.0779 ||: 21%|##1 | 20/95 [00:13<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9204, LAS: 0.8518, UEM: 0.4941, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.5449, partial_loss/deprel_loss: 0.7685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8019, loss: 0.9736, batch_reg_loss: 0.0782, reg_loss: 0.0779 ||: 24%|##4 | 23/95 [00:16<00:54, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8178, UAS: 0.9184, LAS: 0.8495, UEM: 0.4660, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2759, partial_loss/deprel_loss: 1.2168, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3069, loss: 0.9971, batch_reg_loss: 0.0783, reg_loss: 0.0780 ||: 28%|##8 | 27/95 [00:18<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9170, LAS: 0.8477, UEM: 0.4600, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3825, partial_loss/deprel_loss: 0.7065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7200, loss: 1.0084, batch_reg_loss: 0.0783, reg_loss: 0.0780 ||: 32%|###1 | 30/95 [00:20<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9193, LAS: 0.8501, UEM: 0.4875, LEM: 0.2571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7251, partial_loss/deprel_loss: 0.9890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0146, loss: 0.9834, batch_reg_loss: 0.0784, reg_loss: 0.0780 ||: 35%|###4 | 33/95 [00:23<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9216, LAS: 0.8526, UEM: 0.4994, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.9620, batch_reg_loss: 0.0785, reg_loss: 0.0781 ||: 39%|###8 | 37/95 [00:25<00:40, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9241, LAS: 0.8557, UEM: 0.5129, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4850, partial_loss/deprel_loss: 0.7002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7357, loss: 0.9371, batch_reg_loss: 0.0786, reg_loss: 0.0781 ||: 43%|####3 | 41/95 [00:28<00:36, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7890, UAS: 0.9220, LAS: 0.8531, UEM: 0.5083, LEM: 0.2616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5592, partial_loss/deprel_loss: 1.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5060, loss: 0.9564, batch_reg_loss: 0.0786, reg_loss: 0.0782 ||: 47%|####7 | 45/95 [00:30<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9210, LAS: 0.8520, UEM: 0.5033, LEM: 0.2549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3487, partial_loss/deprel_loss: 0.6453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6647, loss: 0.9648, batch_reg_loss: 0.0787, reg_loss: 0.0782 ||: 52%|#####1 | 49/95 [00:33<00:29, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9236, LAS: 0.8552, UEM: 0.5331, LEM: 0.2771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1897, partial_loss/deprel_loss: 0.4239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4559, loss: 0.9363, batch_reg_loss: 0.0788, reg_loss: 0.0783 ||: 56%|#####5 | 53/95 [00:36<00:29, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8068, UAS: 0.9221, LAS: 0.8535, UEM: 0.5169, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3648, partial_loss/deprel_loss: 1.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3851, loss: 0.9517, batch_reg_loss: 0.0789, reg_loss: 0.0783 ||: 60%|###### | 57/95 [00:38<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9216, LAS: 0.8529, UEM: 0.5135, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.5904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6220, loss: 0.9594, batch_reg_loss: 0.0790, reg_loss: 0.0783 ||: 63%|######3 | 60/95 [00:40<00:23, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9202, LAS: 0.8514, UEM: 0.5009, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7087, partial_loss/deprel_loss: 0.8273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8826, loss: 0.9733, batch_reg_loss: 0.0790, reg_loss: 0.0784 ||: 67%|######7 | 64/95 [00:43<00:20, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8087, UAS: 0.9195, LAS: 0.8504, UEM: 0.4911, LEM: 0.2478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3806, partial_loss/deprel_loss: 1.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3796, loss: 0.9849, batch_reg_loss: 0.0791, reg_loss: 0.0784 ||: 72%|#######1 | 68/95 [00:46<00:17, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9189, LAS: 0.8495, UEM: 0.4932, LEM: 0.2464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.7526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.9879, batch_reg_loss: 0.0792, 
reg_loss: 0.0785 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9204, LAS: 0.8514, UEM: 0.5069, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 0.6245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6536, loss: 0.9719, batch_reg_loss: 0.0793, reg_loss: 0.0785 ||: 80%|######## | 76/95 [00:51<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7064, UAS: 0.9186, LAS: 0.8495, UEM: 0.5170, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9467, partial_loss/deprel_loss: 1.9418, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2222, loss: 0.9877, batch_reg_loss: 0.0794, reg_loss: 0.0785 ||: 83%|########3 | 79/95 [00:53<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9169, LAS: 0.8478, UEM: 0.5171, LEM: 0.2693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3720, partial_loss/deprel_loss: 0.6572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6795, loss: 1.0014, batch_reg_loss: 0.0794, reg_loss: 0.0786 ||: 86%|########6 | 82/95 [00:56<00:09, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9178, LAS: 0.8489, UEM: 0.5172, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4747, partial_loss/deprel_loss: 0.6203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.9920, batch_reg_loss: 0.0795, reg_loss: 0.0786 ||: 91%|######### | 86/95 [00:59<00:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7905, UAS: 0.9173, LAS: 0.8484, UEM: 0.5160, 
LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4908, partial_loss/deprel_loss: 1.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4706, loss: 0.9963, batch_reg_loss: 0.0796, reg_loss: 0.0786 ||: 94%|#########3| 89/95 [01:01<00:04, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8267, UAS: 0.9177, LAS: 0.8486, UEM: 0.5121, LEM: 0.2636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8148, partial_loss/deprel_loss: 1.1143, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1341, loss: 0.9947, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||: 97%|#########6| 92/95 [01:03<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8112, UAS: 0.9175, LAS: 0.8483, UEM: 0.5078, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1950, partial_loss/deprel_loss: 1.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3345, loss: 0.9974, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||: 100%|##########| 95/95 [01:05<00:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8112, UAS: 0.9175, LAS: 0.8483, UEM: 0.5078, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1950, partial_loss/deprel_loss: 1.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3345, loss: 0.9974, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - reg_loss | 0.079 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer 
- EUAS | 0.000 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UEM | 0.508 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - LEM | 0.260 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - EM | 0.811 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.195 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UAS | 0.918 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.270 | N/A\n", + "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - loss | 0.997 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - LAS | 0.848 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:54,696 - INFO - combo.training.trainer - 
Epoch duration: 0:01:05.651487\n", + "2023-04-06 23:08:54,697 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:00\n", + "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - Epoch 17/399\n", + "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:08:54,702 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8211, UAS: 0.9094, LAS: 0.8421, UEM: 0.4571, LEM: 0.2251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2175, partial_loss/deprel_loss: 1.1695, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2589, loss: 1.0662, batch_reg_loss: 0.0798, reg_loss: 0.0798 ||: 3%|3 | 3/95 [00:02<01:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9177, LAS: 0.8486, UEM: 0.4710, LEM: 0.2165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6351, partial_loss/deprel_loss: 0.8392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8782, loss: 1.0078, batch_reg_loss: 0.0799, reg_loss: 0.0798 ||: 7%|7 | 7/95 [00:04<01:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9255, LAS: 0.8579, UEM: 0.4782, LEM: 0.2083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2571, partial_loss/deprel_loss: 0.5411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5643, loss: 0.9388, batch_reg_loss: 0.0800, reg_loss: 0.0799 ||: 12%|#1 | 11/95 [00:07<00:59, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8603, UAS: 0.9292, LAS: 0.8630, UEM: 0.5108, LEM: 0.2318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6941, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9013, loss: 0.8938, batch_reg_loss: 0.0800, reg_loss: 0.0799 ||: 15%|#4 | 14/95 [00:09<00:56, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9276, LAS: 0.8610, UEM: 0.4956, LEM: 0.2220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4762, partial_loss/deprel_loss: 0.7494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7748, loss: 0.9064, batch_reg_loss: 0.0801, reg_loss: 0.0799 ||: 18%|#7 | 17/95 [00:12<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9244, LAS: 0.8568, UEM: 0.4666, LEM: 0.2043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7222, partial_loss/deprel_loss: 0.8504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9049, loss: 0.9373, batch_reg_loss: 0.0802, reg_loss: 0.0800 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8657, UAS: 0.9269, LAS: 0.8603, UEM: 0.5326, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5957, partial_loss/deprel_loss: 0.7876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8294, loss: 0.9040, batch_reg_loss: 0.0802, reg_loss: 0.0800 ||: 24%|##4 | 23/95 [00:16<00:54, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9240, LAS: 0.8568, UEM: 0.5163, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9524, partial_loss/deprel_loss: 1.0799, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.1347, loss: 0.9328, batch_reg_loss: 0.0803, reg_loss: 0.0800 ||: 27%|##7 | 26/95 [00:18<00:50, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9238, LAS: 0.8563, UEM: 0.5109, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8677, partial_loss/deprel_loss: 1.1584, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1806, loss: 0.9377, batch_reg_loss: 0.0804, reg_loss: 0.0801 ||: 31%|### | 29/95 [00:21<00:49, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9227, LAS: 0.8549, UEM: 0.5017, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5467, partial_loss/deprel_loss: 0.7827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8159, loss: 0.9461, batch_reg_loss: 0.0804, reg_loss: 0.0801 ||: 35%|###4 | 33/95 [00:23<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9224, LAS: 0.8544, UEM: 0.4874, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4548, partial_loss/deprel_loss: 0.7003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7317, loss: 0.9517, batch_reg_loss: 0.0805, reg_loss: 0.0801 ||: 39%|###8 | 37/95 [00:25<00:38, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9221, LAS: 0.8539, UEM: 0.4947, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7679, loss: 0.9597, batch_reg_loss: 0.0806, reg_loss: 0.0802 ||: 43%|####3 | 41/95 [00:28<00:36, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8369, UAS: 0.9180, LAS: 
0.8491, UEM: 0.4773, LEM: 0.2463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8364, partial_loss/deprel_loss: 0.9655, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0204, loss: 1.0019, batch_reg_loss: 0.0807, reg_loss: 0.0802 ||: 47%|####7 | 45/95 [00:30<00:32, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9179, LAS: 0.8491, UEM: 0.4911, LEM: 0.2535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 0.9998, batch_reg_loss: 0.0808, reg_loss: 0.0803 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9195, LAS: 0.8512, UEM: 0.4988, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.7183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7646, loss: 0.9834, batch_reg_loss: 0.0809, reg_loss: 0.0803 ||: 55%|#####4 | 52/95 [00:35<00:29, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9200, LAS: 0.8515, UEM: 0.4981, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0464, partial_loss/deprel_loss: 1.1652, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2224, loss: 0.9811, batch_reg_loss: 0.0810, reg_loss: 0.0803 ||: 58%|#####7 | 55/95 [00:37<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.9196, LAS: 0.8511, UEM: 0.4950, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5286, partial_loss/deprel_loss: 1.3468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4642, loss: 0.9830, 
batch_reg_loss: 0.0810, reg_loss: 0.0804 ||: 61%|######1 | 58/95 [00:40<00:25, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9208, LAS: 0.8526, UEM: 0.5058, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5972, partial_loss/deprel_loss: 0.8106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.9690, batch_reg_loss: 0.0811, reg_loss: 0.0804 ||: 64%|######4 | 61/95 [00:42<00:24, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9221, LAS: 0.8539, UEM: 0.5137, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8451, partial_loss/deprel_loss: 0.9112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9792, loss: 0.9557, batch_reg_loss: 0.0812, reg_loss: 0.0805 ||: 68%|######8 | 65/95 [00:45<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9227, LAS: 0.8548, UEM: 0.5225, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8310, partial_loss/deprel_loss: 1.0333, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0741, loss: 0.9481, batch_reg_loss: 0.0812, reg_loss: 0.0805 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9229, LAS: 0.8549, UEM: 0.5200, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3519, partial_loss/deprel_loss: 0.5175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5657, loss: 0.9448, batch_reg_loss: 0.0813, reg_loss: 0.0805 ||: 76%|#######5 | 72/95 [00:49<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9218, LAS: 
0.8536, UEM: 0.5125, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5668, partial_loss/deprel_loss: 0.7364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7839, loss: 0.9564, batch_reg_loss: 0.0814, reg_loss: 0.0806 ||: 80%|######## | 76/95 [00:52<00:12, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8361, UAS: 0.9197, LAS: 0.8512, UEM: 0.5029, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8183, partial_loss/deprel_loss: 1.0178, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0594, loss: 0.9775, batch_reg_loss: 0.0815, reg_loss: 0.0806 ||: 84%|########4 | 80/95 [00:54<00:09, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9204, LAS: 0.8520, UEM: 0.5089, LEM: 0.2557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3322, partial_loss/deprel_loss: 0.6043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6315, loss: 0.9704, batch_reg_loss: 0.0816, reg_loss: 0.0807 ||: 88%|########8 | 84/95 [00:57<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7638, UAS: 0.9197, LAS: 0.8513, UEM: 0.5099, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8641, partial_loss/deprel_loss: 1.5048, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6583, loss: 0.9760, batch_reg_loss: 0.0816, reg_loss: 0.0807 ||: 92%|#########1| 87/95 [01:00<00:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9207, LAS: 0.8525, UEM: 0.5240, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 
0.3235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3733, loss: 0.9655, batch_reg_loss: 0.0817, reg_loss: 0.0807 ||: 95%|#########4| 90/95 [01:02<00:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8265, UAS: 0.9196, LAS: 0.8512, UEM: 0.5187, LEM: 0.2684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0582, partial_loss/deprel_loss: 1.0256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1139, loss: 0.9761, batch_reg_loss: 0.0818, reg_loss: 0.0808 ||: 98%|#########7| 93/95 [01:04<00:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9198, LAS: 0.8514, UEM: 0.5192, LEM: 0.2679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3025, partial_loss/deprel_loss: 0.5928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6165, loss: 0.9746, batch_reg_loss: 0.0818, reg_loss: 0.0808 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - reg_loss | 0.081 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - UEM | 0.519 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - LEM | 0.268 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EM | 0.899 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.302 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - 
combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - UAS | 0.920 | N/A\n", + "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.593 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - loss | 0.975 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - LAS | 0.851 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:10:00,783 - INFO - combo.training.trainer - Epoch duration: 0:01:06.086857\n", + "2023-04-06 23:10:00,784 - INFO - combo.training.trainer - Estimated training time remaining: 7:13:08\n", + "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - Epoch 18/399\n", + "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:10:00,790 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8063, UAS: 0.9016, LAS: 0.8326, UEM: 0.3613, LEM: 0.1450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3579, partial_loss/deprel_loss: 1.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 1.1402, batch_reg_loss: 0.0819, reg_loss: 0.0819 ||: 4%|4 | 4/95 [00:02<00:57, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9147, LAS: 0.8475, UEM: 0.4064, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6307, partial_loss/deprel_loss: 0.8028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8504, loss: 1.0049, batch_reg_loss: 0.0820, reg_loss: 0.0819 ||: 8%|8 | 8/95 [00:05<00:55, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9260, LAS: 0.8603, UEM: 0.5197, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.4959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.9117, batch_reg_loss: 0.0821, reg_loss: 0.0820 ||: 13%|#2 | 12/95 [00:07<00:53, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9277, LAS: 0.8604, UEM: 0.5508, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3392, partial_loss/deprel_loss: 0.6802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6942, loss: 0.9067, batch_reg_loss: 0.0822, reg_loss: 0.0820 ||: 16%|#5 | 15/95 [00:09<00:52, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9241, LAS: 0.8566, UEM: 0.5429, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2321, partial_loss/deprel_loss: 
1.1701, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2647, loss: 0.9299, batch_reg_loss: 0.0822, reg_loss: 0.0820 ||: 19%|#8 | 18/95 [00:12<00:52, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9226, LAS: 0.8539, UEM: 0.5082, LEM: 0.2467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7400, partial_loss/deprel_loss: 0.9208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9670, loss: 0.9604, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||: 23%|##3 | 22/95 [00:14<00:47, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8159, UAS: 0.9219, LAS: 0.8527, UEM: 0.4923, LEM: 0.2314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1987, partial_loss/deprel_loss: 1.2112, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2911, loss: 0.9728, batch_reg_loss: 0.0824, reg_loss: 0.0821 ||: 26%|##6 | 25/95 [00:16<00:46, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8190, UAS: 0.9208, LAS: 0.8517, UEM: 0.4836, LEM: 0.2277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2457, partial_loss/deprel_loss: 1.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2364, loss: 0.9771, batch_reg_loss: 0.0824, reg_loss: 0.0821 ||: 29%|##9 | 28/95 [00:18<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9225, LAS: 0.8538, UEM: 0.4998, LEM: 0.2389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3777, partial_loss/deprel_loss: 0.6058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.9584, batch_reg_loss: 0.0825, reg_loss: 0.0822 ||: 33%|###2 | 31/95 [00:20<00:44, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9247, LAS: 0.8565, UEM: 0.5108, LEM: 0.2453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2491, partial_loss/deprel_loss: 0.4766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.9393, batch_reg_loss: 0.0826, reg_loss: 0.0822 ||: 37%|###6 | 35/95 [00:23<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9260, LAS: 0.8585, UEM: 0.5073, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5593, partial_loss/deprel_loss: 0.7965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8317, loss: 0.9242, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||: 41%|####1 | 39/95 [00:26<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9277, LAS: 0.8603, UEM: 0.5189, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4367, partial_loss/deprel_loss: 0.6974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7280, loss: 0.9088, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||: 44%|####4 | 42/95 [00:28<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7823, UAS: 0.9266, LAS: 0.8590, UEM: 0.5181, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6739, partial_loss/deprel_loss: 1.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6553, loss: 0.9214, batch_reg_loss: 0.0828, reg_loss: 0.0823 ||: 47%|####7 | 45/95 [00:30<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9271, LAS: 0.8590, UEM: 0.5167, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.5809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6167, loss: 0.9202, batch_reg_loss: 0.0829, reg_loss: 0.0824 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9254, LAS: 0.8574, UEM: 0.5037, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6386, partial_loss/deprel_loss: 0.8472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8885, loss: 0.9353, batch_reg_loss: 0.0830, reg_loss: 0.0824 ||: 56%|#####5 | 53/95 [00:35<00:27, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9235, LAS: 0.8553, UEM: 0.5002, LEM: 0.2311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.9538, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||: 60%|###### | 57/95 [00:37<00:24, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9217, LAS: 0.8532, UEM: 0.4937, LEM: 0.2270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6313, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.9686, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||: 64%|######4 | 61/95 [00:40<00:21, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9221, LAS: 0.8537, UEM: 0.5130, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8276, partial_loss/deprel_loss: 1.0782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1113, loss: 0.9656, batch_reg_loss: 0.0832, reg_loss: 0.0825 ||: 68%|######8 | 65/95 [00:43<00:20, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9227, LAS: 0.8546, UEM: 0.5260, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3946, partial_loss/deprel_loss: 0.6266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6635, loss: 0.9557, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||: 72%|#######1 | 68/95 [00:46<00:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8142, UAS: 0.9225, LAS: 0.8545, UEM: 0.5218, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3803, partial_loss/deprel_loss: 1.2825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3855, loss: 0.9600, batch_reg_loss: 0.0834, reg_loss: 0.0826 ||: 75%|#######4 | 71/95 [00:48<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7495, UAS: 0.9206, LAS: 0.8526, UEM: 0.5165, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2523, partial_loss/deprel_loss: 1.6199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8299, loss: 0.9755, batch_reg_loss: 0.0835, reg_loss: 0.0826 ||: 78%|#######7 | 74/95 [00:50<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9207, LAS: 0.8526, UEM: 0.5172, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.7071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.9738, batch_reg_loss: 0.0835, reg_loss: 0.0827 ||: 82%|########2 | 78/95 [00:53<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7802, UAS: 0.9204, LAS: 0.8522, UEM: 0.5150, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.7017, partial_loss/deprel_loss: 1.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5967, loss: 0.9763, batch_reg_loss: 0.0836, reg_loss: 0.0827 ||: 86%|########6 | 82/95 [00:55<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9201, LAS: 0.8519, UEM: 0.5133, LEM: 0.2586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8410, partial_loss/deprel_loss: 0.9424, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0059, loss: 0.9782, batch_reg_loss: 0.0837, reg_loss: 0.0828 ||: 91%|######### | 86/95 [00:58<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9205, LAS: 0.8524, UEM: 0.5166, LEM: 0.2627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.8882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9179, loss: 0.9757, batch_reg_loss: 0.0838, reg_loss: 0.0828 ||: 95%|#########4| 90/95 [01:00<00:03, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9208, LAS: 0.8527, UEM: 0.5221, LEM: 0.2707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7381, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0161, loss: 0.9715, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||: 99%|#########8| 94/95 [01:02<00:00, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8543, UAS: 0.9209, LAS: 0.8527, UEM: 0.5206, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6922, partial_loss/deprel_loss: 0.8876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9324, loss: 0.9711, batch_reg_loss: 
0.0839, reg_loss: 0.0829 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - reg_loss | 0.083 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - UEM | 0.521 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - LEM | 0.269 | N/A\n", + "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EM | 0.854 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.692 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - UAS | 0.921 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.888 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - loss | 0.971 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - LAS | 0.853 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + 
"2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:11:04,382 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:11:04,382 - INFO - combo.training.trainer - Epoch duration: 0:01:03.598358\n", + "2023-04-06 23:11:04,382 - INFO - combo.training.trainer - Estimated training time remaining: 7:10:31\n", + "2023-04-06 23:11:04,382 - INFO - allennlp.training.trainer - Epoch 19/399\n", + "2023-04-06 23:11:04,382 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:11:04,383 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:11:04,388 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9435, LAS: 0.8860, UEM: 0.7204, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9285, partial_loss/deprel_loss: 1.0618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1192, loss: 0.6993, batch_reg_loss: 0.0840, reg_loss: 0.0840 ||: 3%|3 | 3/95 [00:02<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8009, UAS: 0.9156, LAS: 0.8519, UEM: 0.5387, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6037, partial_loss/deprel_loss: 1.2293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3883, loss: 0.9807, batch_reg_loss: 0.0841, reg_loss: 0.0840 ||: 7%|7 | 7/95 [00:04<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9223, LAS: 0.8586, UEM: 0.5432, 
LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3469, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.9240, batch_reg_loss: 0.0841, reg_loss: 0.0840 ||: 11%|# | 10/95 [00:07<01:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9256, LAS: 0.8612, UEM: 0.5207, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8806, partial_loss/deprel_loss: 0.9421, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0140, loss: 0.8929, batch_reg_loss: 0.0842, reg_loss: 0.0841 ||: 15%|#4 | 14/95 [00:09<00:57, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7806, UAS: 0.9192, LAS: 0.8538, UEM: 0.5271, LEM: 0.2799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6357, partial_loss/deprel_loss: 1.4219, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5490, loss: 0.9499, batch_reg_loss: 0.0843, reg_loss: 0.0841 ||: 19%|#8 | 18/95 [00:12<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9156, LAS: 0.8487, UEM: 0.4943, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5104, partial_loss/deprel_loss: 0.7872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.9940, batch_reg_loss: 0.0844, reg_loss: 0.0842 ||: 23%|##3 | 22/95 [00:14<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9168, LAS: 0.8503, UEM: 0.4811, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7056, partial_loss/deprel_loss: 0.8735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9244, loss: 0.9825, batch_reg_loss: 0.0845, reg_loss: 0.0842 ||: 
26%|##6 | 25/95 [00:16<00:46, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9175, LAS: 0.8506, UEM: 0.4635, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4135, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 0.9775, batch_reg_loss: 0.0846, reg_loss: 0.0843 ||: 31%|### | 29/95 [00:18<00:41, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9197, LAS: 0.8531, UEM: 0.4805, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.6840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7122, loss: 0.9550, batch_reg_loss: 0.0847, reg_loss: 0.0843 ||: 35%|###4 | 33/95 [00:21<00:40, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9224, LAS: 0.8559, UEM: 0.5072, LEM: 0.2469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5645, loss: 0.9343, batch_reg_loss: 0.0848, reg_loss: 0.0844 ||: 39%|###8 | 37/95 [00:24<00:39, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9217, LAS: 0.8554, UEM: 0.4989, LEM: 0.2412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5131, partial_loss/deprel_loss: 0.6908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7401, loss: 0.9416, batch_reg_loss: 0.0849, reg_loss: 0.0844 ||: 42%|####2 | 40/95 [00:26<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9233, 
LAS: 0.8573, UEM: 0.5106, LEM: 0.2486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9475, partial_loss/deprel_loss: 1.0811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1393, loss: 0.9286, batch_reg_loss: 0.0849, reg_loss: 0.0844 ||: 45%|####5 | 43/95 [00:28<00:36, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9236, LAS: 0.8577, UEM: 0.5018, LEM: 0.2420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9378, partial_loss/deprel_loss: 0.9711, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0495, loss: 0.9265, batch_reg_loss: 0.0850, reg_loss: 0.0845 ||: 48%|####8 | 46/95 [00:31<00:34, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9245, LAS: 0.8588, UEM: 0.5113, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.5103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5608, loss: 0.9145, batch_reg_loss: 0.0851, reg_loss: 0.0845 ||: 52%|#####1 | 49/95 [00:33<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9246, LAS: 0.8589, UEM: 0.5174, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4168, partial_loss/deprel_loss: 0.7370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7581, loss: 0.9116, batch_reg_loss: 0.0851, reg_loss: 0.0845 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9250, LAS: 0.8593, UEM: 0.5118, LEM: 0.2468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7121, partial_loss/deprel_loss: 0.8879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9379, loss: 0.9107, 
batch_reg_loss: 0.0852, reg_loss: 0.0846 ||: 59%|#####8 | 56/95 [00:37<00:26, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9247, LAS: 0.8590, UEM: 0.5060, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1599, partial_loss/deprel_loss: 1.1592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2446, loss: 0.9141, batch_reg_loss: 0.0853, reg_loss: 0.0846 ||: 62%|######2 | 59/95 [00:39<00:24, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8143, UAS: 0.9251, LAS: 0.8594, UEM: 0.5113, LEM: 0.2465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3870, partial_loss/deprel_loss: 1.3038, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4058, loss: 0.9143, batch_reg_loss: 0.0853, reg_loss: 0.0846 ||: 65%|######5 | 62/95 [00:42<00:23, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9266, LAS: 0.8613, UEM: 0.5381, LEM: 0.2765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1560, partial_loss/deprel_loss: 0.3884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4274, loss: 0.8983, batch_reg_loss: 0.0854, reg_loss: 0.0847 ||: 69%|######9 | 66/95 [00:44<00:20, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9263, LAS: 0.8610, UEM: 0.5383, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.4687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.9019, batch_reg_loss: 0.0855, reg_loss: 0.0847 ||: 73%|#######2 | 69/95 [00:47<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9269, LAS: 0.8615, 
UEM: 0.5384, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4765, partial_loss/deprel_loss: 0.6877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7310, loss: 0.8967, batch_reg_loss: 0.0855, reg_loss: 0.0848 ||: 76%|#######5 | 72/95 [00:49<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8586, UAS: 0.9264, LAS: 0.8608, UEM: 0.5295, LEM: 0.2685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.8600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 0.9015, batch_reg_loss: 0.0856, reg_loss: 0.0848 ||: 80%|######## | 76/95 [00:51<00:12, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7132, UAS: 0.9240, LAS: 0.8580, UEM: 0.5249, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6995, partial_loss/deprel_loss: 1.8867, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1350, loss: 0.9255, batch_reg_loss: 0.0857, reg_loss: 0.0848 ||: 84%|########4 | 80/95 [00:53<00:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8211, UAS: 0.9225, LAS: 0.8562, UEM: 0.5163, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0998, partial_loss/deprel_loss: 1.1962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2627, loss: 0.9415, batch_reg_loss: 0.0858, reg_loss: 0.0849 ||: 88%|########8 | 84/95 [00:56<00:07, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9213, LAS: 0.8547, UEM: 0.5081, LEM: 0.2550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2418, partial_loss/deprel_loss: 1.2224, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3122, loss: 0.9540, 
batch_reg_loss: 0.0859, reg_loss: 0.0849 ||: 93%|#########2| 88/95 [00:59<00:04, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9229, LAS: 0.8565, UEM: 0.5315, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4410, partial_loss/deprel_loss: 0.8339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8413, loss: 0.9397, batch_reg_loss: 0.0860, reg_loss: 0.0850 ||: 97%|#########6| 92/95 [01:02<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9226, LAS: 0.8561, UEM: 0.5297, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.6098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.9430, batch_reg_loss: 0.0861, reg_loss: 0.0850 ||: 100%|##########| 95/95 [01:04<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9226, LAS: 0.8561, UEM: 0.5297, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.6098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.9430, batch_reg_loss: 0.0861, reg_loss: 0.0850 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - reg_loss | 0.085 | N/A\n", + "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UEM | 
0.530 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LEM | 0.278 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - EM | 0.890 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.354 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UAS | 0.923 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.610 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - loss | 0.943 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LAS | 0.856 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.325 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:08,725 - INFO - combo.training.trainer - Epoch duration: 0:01:04.342871\n", + "2023-04-06 23:12:08,725 - INFO - combo.training.trainer - Estimated training time remaining: 7:08:17\n", + "2023-04-06 23:12:08,725 - INFO - 
allennlp.training.trainer - Epoch 20/399\n", + "2023-04-06 23:12:08,725 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:12:08,726 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:12:08,732 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9110, LAS: 0.8443, UEM: 0.3849, LEM: 0.1702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2972, partial_loss/deprel_loss: 0.5319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 1.0397, batch_reg_loss: 0.0862, reg_loss: 0.0861 ||: 4%|4 | 4/95 [00:02<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9310, LAS: 0.8659, UEM: 0.5533, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3611, partial_loss/deprel_loss: 0.5817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.8645, batch_reg_loss: 0.0862, reg_loss: 0.0862 ||: 8%|8 | 8/95 [00:05<00:58, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9336, LAS: 0.8679, UEM: 0.5478, LEM: 0.2519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4877, partial_loss/deprel_loss: 0.6900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7359, loss: 0.8320, batch_reg_loss: 0.0863, reg_loss: 0.0862 ||: 12%|#1 | 11/95 [00:07<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9324, LAS: 0.8653, UEM: 0.5534, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, 
partial_loss/deprel_loss: 0.6690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7038, loss: 0.8553, batch_reg_loss: 0.0864, reg_loss: 0.0862 ||: 16%|#5 | 15/95 [00:09<00:51, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9284, LAS: 0.8616, UEM: 0.5068, LEM: 0.2273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1938, partial_loss/deprel_loss: 1.0830, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1916, loss: 0.8870, batch_reg_loss: 0.0865, reg_loss: 0.0863 ||: 20%|## | 19/95 [00:12<00:47, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9314, LAS: 0.8659, UEM: 0.5482, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6033, partial_loss/deprel_loss: 0.7846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8348, loss: 0.8500, batch_reg_loss: 0.0865, reg_loss: 0.0863 ||: 23%|##3 | 22/95 [00:14<00:51, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9259, LAS: 0.8598, UEM: 0.5101, LEM: 0.2451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9727, partial_loss/deprel_loss: 1.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1570, loss: 0.9070, batch_reg_loss: 0.0866, reg_loss: 0.0864 ||: 27%|##7 | 26/95 [00:17<00:46, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9231, LAS: 0.8571, UEM: 0.4837, LEM: 0.2284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5614, partial_loss/deprel_loss: 0.6820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7446, loss: 0.9337, batch_reg_loss: 0.0867, reg_loss: 0.0864 ||: 32%|###1 | 30/95 [00:19<00:42, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9254, LAS: 0.8596, UEM: 0.5063, LEM: 0.2410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6332, loss: 0.9123, batch_reg_loss: 0.0868, reg_loss: 0.0864 ||: 35%|###4 | 33/95 [00:22<00:43, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7897, UAS: 0.9223, LAS: 0.8554, UEM: 0.4936, LEM: 0.2330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7403, partial_loss/deprel_loss: 1.4286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5778, loss: 0.9495, batch_reg_loss: 0.0869, reg_loss: 0.0865 ||: 39%|###8 | 37/95 [00:24<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9210, LAS: 0.8539, UEM: 0.4811, LEM: 0.2228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5754, partial_loss/deprel_loss: 0.8188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8571, loss: 0.9656, batch_reg_loss: 0.0870, reg_loss: 0.0865 ||: 43%|####3 | 41/95 [00:26<00:35, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9231, LAS: 0.8565, UEM: 0.5083, LEM: 0.2521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1527, partial_loss/deprel_loss: 0.4154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.9443, batch_reg_loss: 0.0871, reg_loss: 0.0866 ||: 47%|####7 | 45/95 [00:29<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9231, LAS: 0.8567, UEM: 0.5003, LEM: 0.2448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7734, partial_loss/deprel_loss: 0.9690, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0170, loss: 0.9441, batch_reg_loss: 0.0871, reg_loss: 0.0866 ||: 51%|##### | 48/95 [00:31<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9250, LAS: 0.8595, UEM: 0.5372, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.9245, batch_reg_loss: 0.0872, reg_loss: 0.0866 ||: 54%|#####3 | 51/95 [00:34<00:31, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9266, LAS: 0.8612, UEM: 0.5460, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3473, partial_loss/deprel_loss: 0.5949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6327, loss: 0.9112, batch_reg_loss: 0.0873, reg_loss: 0.0867 ||: 57%|#####6 | 54/95 [00:36<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9251, LAS: 0.8595, UEM: 0.5404, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0079, partial_loss/deprel_loss: 0.9937, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.9280, batch_reg_loss: 0.0874, reg_loss: 0.0867 ||: 61%|######1 | 58/95 [00:38<00:24, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9247, LAS: 0.8591, UEM: 0.5448, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.7013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7582, loss: 0.9304, batch_reg_loss: 0.0874, reg_loss: 0.0868 ||: 65%|######5 | 62/95 [00:41<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8300, UAS: 0.9228, LAS: 0.8570, UEM: 0.5325, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0626, partial_loss/deprel_loss: 1.0727, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1582, loss: 0.9464, batch_reg_loss: 0.0875, reg_loss: 0.0868 ||: 69%|######9 | 66/95 [00:44<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9230, LAS: 0.8569, UEM: 0.5244, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.7219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7614, loss: 0.9487, batch_reg_loss: 0.0876, reg_loss: 0.0868 ||: 74%|#######3 | 70/95 [00:47<00:17, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9237, LAS: 0.8577, UEM: 0.5248, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4907, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7911, loss: 0.9429, batch_reg_loss: 0.0877, reg_loss: 0.0869 ||: 77%|#######6 | 73/95 [00:49<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9242, LAS: 0.8581, UEM: 0.5217, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.6355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6667, loss: 0.9388, batch_reg_loss: 0.0878, reg_loss: 0.0869 ||: 81%|########1 | 77/95 [00:51<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7475, UAS: 0.9237, LAS: 0.8577, UEM: 0.5224, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 2.3742, partial_loss/deprel_loss: 1.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8683, loss: 0.9423, batch_reg_loss: 0.0879, reg_loss: 0.0870 ||: 85%|########5 | 81/95 [00:54<00:09, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9248, LAS: 0.8591, UEM: 0.5373, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6663, partial_loss/deprel_loss: 0.7912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.9301, batch_reg_loss: 0.0879, reg_loss: 0.0870 ||: 88%|########8 | 84/95 [00:56<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7260, UAS: 0.9236, LAS: 0.8578, UEM: 0.5355, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6770, partial_loss/deprel_loss: 1.8716, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1207, loss: 0.9407, batch_reg_loss: 0.0880, reg_loss: 0.0870 ||: 92%|#########1| 87/95 [00:58<00:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9228, LAS: 0.8568, UEM: 0.5279, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9349, partial_loss/deprel_loss: 1.0539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1182, loss: 0.9479, batch_reg_loss: 0.0881, reg_loss: 0.0871 ||: 95%|#########4| 90/95 [01:00<00:03, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9235, LAS: 0.8578, UEM: 0.5311, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7756, partial_loss/deprel_loss: 0.8687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9383, loss: 0.9384, batch_reg_loss: 0.0882, reg_loss: 0.0871 ||: 99%|#########8| 94/95 [01:03<00:00, 
1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9237, LAS: 0.8579, UEM: 0.5307, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5919, partial_loss/deprel_loss: 0.8331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8731, loss: 0.9377, batch_reg_loss: 0.0882, reg_loss: 0.0871 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-06 23:13:12,510 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9319, LAS: 0.8801, UEM: 0.7776, LEM: 0.6212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2257, partial_loss/deprel_loss: 19.5722, partial_loss/cycle_loss: 0.0000, batch_loss: 15.7029, loss: 30.2250, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.08s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9292, LAS: 0.8706, UEM: 0.5947, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7996, partial_loss/deprel_loss: 32.6935, partial_loss/cycle_loss: 0.0000, batch_loss: 26.3147, loss: 28.7042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:06, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9410, LAS: 0.8846, UEM: 0.6785, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 23.8122, partial_loss/cycle_loss: 0.0000, batch_loss: 19.1238, loss: 25.7829, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:06<00:04, 1.04s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9129, UAS: 0.9433, LAS: 0.8857, UEM: 0.6618, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3140, partial_loss/deprel_loss: 27.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 22.0972, loss: 26.3043, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9434, LAS: 0.8851, UEM: 0.6533, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5105, partial_loss/deprel_loss: 23.3250, partial_loss/cycle_loss: 0.0000, batch_loss: 18.7621, loss: 25.6187, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.13it/s]\n", + "2023-04-06 23:13:22,264 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - reg_loss | 0.087 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UEM | 0.531 | 0.653\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - LEM | 0.278 | 0.374\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EM | 0.870 | 0.879\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.592 | 0.510\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UAS | 0.924 | 
0.943\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.833 | 23.325\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - loss | 0.938 | 25.619\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - LAS | 0.858 | 0.885\n", + "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.trainer - Epoch duration: 0:01:13.540946\n", + "2023-04-06 23:13:22,266 - INFO - combo.training.trainer - Estimated training time remaining: 7:08:57\n", + "2023-04-06 23:13:22,266 - INFO - allennlp.training.trainer - Epoch 21/399\n", + "2023-04-06 23:13:22,267 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:13:22,267 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:13:22,273 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9221, LAS: 0.8546, UEM: 0.3557, LEM: 0.1229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4082, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7001, loss: 0.9470, batch_reg_loss: 0.0883, reg_loss: 0.0882 ||: 4%|4 | 4/95 [00:02<00:54, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9199, LAS: 0.8541, UEM: 0.3511, LEM: 0.1239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9181, partial_loss/deprel_loss: 1.0244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0915, loss: 0.9805, batch_reg_loss: 0.0883, reg_loss: 0.0883 ||: 7%|7 | 7/95 [00:04<00:58, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9295, LAS: 0.8663, UEM: 0.6005, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0708, partial_loss/deprel_loss: 0.2353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2908, loss: 0.8785, batch_reg_loss: 0.0884, reg_loss: 0.0883 ||: 11%|# | 10/95 [00:07<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8384, UAS: 0.9190, LAS: 0.8538, UEM: 0.5549, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9296, partial_loss/deprel_loss: 1.0548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1183, loss: 0.9701, batch_reg_loss: 0.0885, reg_loss: 0.0883 ||: 14%|#3 | 13/95 [00:09<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9230, LAS: 0.8573, UEM: 0.5473, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.8580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8901, loss: 0.9454, batch_reg_loss: 0.0886, reg_loss: 0.0884 ||: 18%|#7 | 17/95 [00:11<00:52, 1.50it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9273, LAS: 0.8625, UEM: 0.5692, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2405, partial_loss/deprel_loss: 0.4936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.9059, batch_reg_loss: 0.0887, reg_loss: 0.0884 ||: 22%|##2 | 21/95 [00:14<00:48, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9278, LAS: 0.8636, UEM: 0.5645, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2945, partial_loss/deprel_loss: 0.5534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5904, loss: 0.9013, batch_reg_loss: 0.0887, reg_loss: 0.0885 ||: 25%|##5 | 24/95 [00:16<00:47, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9298, LAS: 0.8662, UEM: 0.5759, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.8804, batch_reg_loss: 0.0888, reg_loss: 0.0885 ||: 29%|##9 | 28/95 [00:19<00:44, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9313, LAS: 0.8677, UEM: 0.5794, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2287, partial_loss/deprel_loss: 0.4578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.8691, batch_reg_loss: 0.0889, reg_loss: 0.0886 ||: 33%|###2 | 31/95 [00:21<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9322, LAS: 0.8694, UEM: 0.5735, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4688, partial_loss/deprel_loss: 0.6444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.8587, batch_reg_loss: 0.0890, reg_loss: 0.0886 ||: 36%|###5 | 34/95 [00:23<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9288, LAS: 0.8655, UEM: 0.5588, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5252, partial_loss/deprel_loss: 0.7641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8053, loss: 0.8868, batch_reg_loss: 0.0890, reg_loss: 0.0886 ||: 39%|###8 | 37/95 [00:25<00:40, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9269, LAS: 0.8634, UEM: 0.5501, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8205, partial_loss/deprel_loss: 0.9077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9794, loss: 0.9034, batch_reg_loss: 0.0891, reg_loss: 0.0887 ||: 42%|####2 | 40/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9280, LAS: 0.8645, UEM: 0.5619, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5773, partial_loss/deprel_loss: 0.7543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8081, loss: 0.8940, batch_reg_loss: 0.0892, reg_loss: 0.0887 ||: 46%|####6 | 44/95 [00:30<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8614, UAS: 0.9255, LAS: 0.8619, UEM: 0.5429, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8078, partial_loss/deprel_loss: 0.8197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9065, loss: 0.9176, batch_reg_loss: 0.0893, reg_loss: 0.0887 ||: 51%|##### | 48/95 [00:32<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9226, LAS: 0.8587, UEM: 0.5308, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2410, partial_loss/deprel_loss: 1.1667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2709, loss: 0.9484, batch_reg_loss: 0.0893, reg_loss: 0.0888 ||: 54%|#####3 | 51/95 [00:35<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9237, LAS: 0.8598, UEM: 0.5345, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5769, loss: 0.9379, batch_reg_loss: 0.0894, reg_loss: 0.0888 ||: 57%|#####6 | 54/95 [00:37<00:28, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9241, LAS: 0.8602, UEM: 0.5310, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6501, partial_loss/deprel_loss: 0.8100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.9327, batch_reg_loss: 0.0895, reg_loss: 0.0888 ||: 60%|###### | 57/95 [00:39<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7886, UAS: 0.9236, LAS: 0.8593, UEM: 0.5250, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6350, partial_loss/deprel_loss: 1.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5108, loss: 0.9359, batch_reg_loss: 0.0896, reg_loss: 0.0889 ||: 64%|######4 | 61/95 [00:41<00:22, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8438, UAS: 0.9245, LAS: 0.8600, UEM: 0.5268, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, 
partial_loss/deprel_loss: 1.0441, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0757, loss: 0.9285, batch_reg_loss: 0.0897, reg_loss: 0.0889 ||: 68%|######8 | 65/95 [00:44<00:20, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8068, UAS: 0.9245, LAS: 0.8603, UEM: 0.5323, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4523, partial_loss/deprel_loss: 1.2092, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3476, loss: 0.9238, batch_reg_loss: 0.0897, reg_loss: 0.0890 ||: 72%|#######1 | 68/95 [00:46<00:19, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9241, LAS: 0.8601, UEM: 0.5268, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6872, partial_loss/deprel_loss: 0.9213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9643, loss: 0.9281, batch_reg_loss: 0.0898, reg_loss: 0.0890 ||: 75%|#######4 | 71/95 [00:49<00:17, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9234, LAS: 0.8594, UEM: 0.5213, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3491, partial_loss/deprel_loss: 1.1402, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2719, loss: 0.9356, batch_reg_loss: 0.0899, reg_loss: 0.0890 ||: 79%|#######8 | 75/95 [00:51<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9236, LAS: 0.8595, UEM: 0.5278, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3342, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6382, loss: 0.9324, batch_reg_loss: 0.0900, reg_loss: 0.0891 ||: 
82%|########2 | 78/95 [00:53<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7965, UAS: 0.9235, LAS: 0.8593, UEM: 0.5329, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7970, partial_loss/deprel_loss: 1.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5456, loss: 0.9340, batch_reg_loss: 0.0901, reg_loss: 0.0891 ||: 85%|########5 | 81/95 [00:55<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9231, LAS: 0.8588, UEM: 0.5271, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5215, partial_loss/deprel_loss: 0.6945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7501, loss: 0.9381, batch_reg_loss: 0.0901, reg_loss: 0.0892 ||: 88%|########8 | 84/95 [00:57<00:07, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9242, LAS: 0.8600, UEM: 0.5301, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5919, partial_loss/deprel_loss: 0.7680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8230, loss: 0.9284, batch_reg_loss: 0.0902, reg_loss: 0.0892 ||: 93%|#########2| 88/95 [01:00<00:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9248, LAS: 0.8606, UEM: 0.5364, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6627, partial_loss/deprel_loss: 0.8353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8911, loss: 0.9216, batch_reg_loss: 0.0903, reg_loss: 0.0892 ||: 97%|#########6| 92/95 [01:03<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9251, LAS: 0.8608, UEM: 0.5348, LEM: 0.2797, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7600, partial_loss/deprel_loss: 0.8205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8988, loss: 0.9181, batch_reg_loss: 0.0904, reg_loss: 0.0893 ||: 100%|##########| 95/95 [01:04<00:00, 1.46it/s]\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - reg_loss | 0.089 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UEM | 0.535 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - LEM | 0.280 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EM | 0.858 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.760 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UAS | 0.925 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.820 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - loss | 0.918 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - LAS | 0.861 | N/A\n", + "2023-04-06 
23:14:27,262 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:27,263 - INFO - combo.training.trainer - Epoch duration: 0:01:04.996104\n", + "2023-04-06 23:14:27,263 - INFO - combo.training.trainer - Estimated training time remaining: 7:06:59\n", + "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - Epoch 22/399\n", + "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:14:27,269 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9550, LAS: 0.8944, UEM: 0.6711, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.6435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6794, loss: 0.6546, batch_reg_loss: 0.0904, reg_loss: 0.0904 ||: 3%|3 | 3/95 [00:02<01:12, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9571, LAS: 0.8994, UEM: 0.7498, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1352, partial_loss/deprel_loss: 0.2762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3385, loss: 0.5984, batch_reg_loss: 0.0905, reg_loss: 0.0904 
||: 6%|6 | 6/95 [00:04<01:10, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9366, LAS: 0.8751, UEM: 0.6501, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7438, partial_loss/deprel_loss: 0.9171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.7992, batch_reg_loss: 0.0906, reg_loss: 0.0905 ||: 11%|# | 10/95 [00:06<01:01, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9245, LAS: 0.8616, UEM: 0.5855, LEM: 0.3379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5410, partial_loss/deprel_loss: 0.6696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7345, loss: 0.9022, batch_reg_loss: 0.0906, reg_loss: 0.0905 ||: 15%|#4 | 14/95 [00:09<00:55, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9253, LAS: 0.8622, UEM: 0.5631, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.6379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6676, loss: 0.9063, batch_reg_loss: 0.0907, reg_loss: 0.0906 ||: 19%|#8 | 18/95 [00:11<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9255, LAS: 0.8618, UEM: 0.5433, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1120, partial_loss/deprel_loss: 1.0946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1888, loss: 0.9048, batch_reg_loss: 0.0908, reg_loss: 0.0906 ||: 22%|##2 | 21/95 [00:14<00:52, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9284, LAS: 
0.8650, UEM: 0.5625, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3439, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.8739, batch_reg_loss: 0.0909, reg_loss: 0.0906 ||: 25%|##5 | 24/95 [00:16<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9261, LAS: 0.8622, UEM: 0.5615, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6291, partial_loss/deprel_loss: 0.7910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8496, loss: 0.8936, batch_reg_loss: 0.0909, reg_loss: 0.0907 ||: 28%|##8 | 27/95 [00:18<00:50, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9276, LAS: 0.8640, UEM: 0.5600, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7352, partial_loss/deprel_loss: 0.9390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9892, loss: 0.8841, batch_reg_loss: 0.0910, reg_loss: 0.0907 ||: 32%|###1 | 30/95 [00:21<00:47, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9267, LAS: 0.8631, UEM: 0.5387, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7497, partial_loss/deprel_loss: 0.8094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8885, loss: 0.8920, batch_reg_loss: 0.0911, reg_loss: 0.0907 ||: 35%|###4 | 33/95 [00:23<00:44, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9277, LAS: 0.8640, UEM: 0.5550, LEM: 0.2830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3010, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.8830, batch_reg_loss: 
0.0912, reg_loss: 0.0908 ||: 39%|###8 | 37/95 [00:26<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9279, LAS: 0.8642, UEM: 0.5553, LEM: 0.2845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8983, partial_loss/deprel_loss: 1.0623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1207, loss: 0.8820, batch_reg_loss: 0.0912, reg_loss: 0.0908 ||: 42%|####2 | 40/95 [00:28<00:40, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9271, LAS: 0.8628, UEM: 0.5414, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0324, partial_loss/deprel_loss: 1.0027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0999, loss: 0.8922, batch_reg_loss: 0.0913, reg_loss: 0.0908 ||: 45%|####5 | 43/95 [00:30<00:37, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.9257, LAS: 0.8616, UEM: 0.5265, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1586, partial_loss/deprel_loss: 1.1841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2703, loss: 0.9049, batch_reg_loss: 0.0914, reg_loss: 0.0909 ||: 49%|####9 | 47/95 [00:33<00:33, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8048, UAS: 0.9250, LAS: 0.8605, UEM: 0.5145, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3112, partial_loss/deprel_loss: 1.1704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2900, loss: 0.9120, batch_reg_loss: 0.0915, reg_loss: 0.0909 ||: 54%|#####3 | 51/95 [00:35<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9254, LAS: 0.8609, UEM: 0.5121, LEM: 0.2531, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2439, partial_loss/deprel_loss: 0.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.9080, batch_reg_loss: 0.0915, reg_loss: 0.0910 ||: 58%|#####7 | 55/95 [00:38<00:26, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9269, LAS: 0.8626, UEM: 0.5298, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4415, loss: 0.8933, batch_reg_loss: 0.0916, reg_loss: 0.0910 ||: 61%|######1 | 58/95 [00:40<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9246, LAS: 0.8602, UEM: 0.5197, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7664, partial_loss/deprel_loss: 0.9591, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0123, loss: 0.9131, batch_reg_loss: 0.0917, reg_loss: 0.0910 ||: 65%|######5 | 62/95 [00:42<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9247, LAS: 0.8607, UEM: 0.5253, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4750, partial_loss/deprel_loss: 0.7193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7622, loss: 0.9094, batch_reg_loss: 0.0918, reg_loss: 0.0911 ||: 69%|######9 | 66/95 [00:45<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8741, UAS: 0.9260, LAS: 0.8624, UEM: 0.5400, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4970, partial_loss/deprel_loss: 0.6956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.8936, batch_reg_loss: 0.0919, reg_loss: 
0.0911 ||: 74%|#######3 | 70/95 [00:48<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9253, LAS: 0.8616, UEM: 0.5566, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0800, partial_loss/deprel_loss: 0.2153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2802, loss: 0.9009, batch_reg_loss: 0.0920, reg_loss: 0.0912 ||: 77%|#######6 | 73/95 [00:51<00:16, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9253, LAS: 0.8615, UEM: 0.5530, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8445, partial_loss/deprel_loss: 1.0010, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0617, loss: 0.9044, batch_reg_loss: 0.0920, reg_loss: 0.0912 ||: 80%|######## | 76/95 [00:53<00:14, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9254, LAS: 0.8613, UEM: 0.5480, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5778, partial_loss/deprel_loss: 0.8384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8784, loss: 0.9069, batch_reg_loss: 0.0921, reg_loss: 0.0912 ||: 84%|########4 | 80/95 [00:56<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8113, UAS: 0.9241, LAS: 0.8598, UEM: 0.5398, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6084, partial_loss/deprel_loss: 1.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4375, loss: 0.9203, batch_reg_loss: 0.0922, reg_loss: 0.0913 ||: 87%|########7 | 83/95 [00:58<00:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8501, UAS: 0.9246, LAS: 0.8605, UEM: 0.5373, LEM: 0.2892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8148, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9702, loss: 0.9162, batch_reg_loss: 0.0922, reg_loss: 0.0913 ||: 91%|######### | 86/95 [01:00<00:06, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9245, LAS: 0.8603, UEM: 0.5389, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.5576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6059, loss: 0.9188, batch_reg_loss: 0.0923, reg_loss: 0.0913 ||: 95%|#########4| 90/95 [01:03<00:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9248, LAS: 0.8607, UEM: 0.5360, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7173, partial_loss/deprel_loss: 0.9406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9883, loss: 0.9151, batch_reg_loss: 0.0924, reg_loss: 0.0914 ||: 99%|#########8| 94/95 [01:05<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9250, LAS: 0.8609, UEM: 0.5356, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5528, partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.9139, batch_reg_loss: 0.0924, reg_loss: 0.0914 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - reg_loss | 0.091 | N/A\n", + 
"2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UEM | 0.536 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - LEM | 0.285 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EM | 0.878 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.553 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UAS | 0.925 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.745 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - loss | 0.914 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - LAS | 0.861 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:15:33,696 - INFO - combo.training.trainer - Epoch duration: 0:01:06.432977\n", + "2023-04-06 23:15:33,696 - INFO - combo.training.trainer - Estimated training time remaining: 7:05:29\n", + "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - Epoch 23/399\n", + "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:15:33,703 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9396, LAS: 0.8879, UEM: 0.7813, LEM: 0.6526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9156, partial_loss/deprel_loss: 0.9224, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0136, loss: 0.7480, batch_reg_loss: 0.0925, reg_loss: 0.0925 ||: 3%|3 | 3/95 [00:02<01:13, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9246, LAS: 0.8641, UEM: 0.6055, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8152, partial_loss/deprel_loss: 0.9452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0118, loss: 0.9061, batch_reg_loss: 0.0926, reg_loss: 0.0925 ||: 7%|7 | 7/95 [00:04<01:05, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9336, LAS: 0.8745, UEM: 0.6267, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.6305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.8215, batch_reg_loss: 0.0927, reg_loss: 0.0926 ||: 11%|# | 10/95 [00:07<01:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8429, UAS: 0.9333, LAS: 0.8736, UEM: 0.5851, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9253, partial_loss/deprel_loss: 0.9607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0464, loss: 0.8242, batch_reg_loss: 0.0928, reg_loss: 0.0926 ||: 15%|#4 | 14/95 [00:09<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9306, LAS: 0.8685, UEM: 0.5478, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3530, partial_loss/deprel_loss: 0.6736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7023, loss: 0.8645, batch_reg_loss: 0.0928, reg_loss: 0.0927 ||: 19%|#8 | 18/95 [00:11<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9233, LAS: 0.8608, UEM: 0.5436, LEM: 0.3292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3514, partial_loss/deprel_loss: 0.4489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5223, loss: 0.9171, batch_reg_loss: 0.0929, reg_loss: 0.0927 ||: 22%|##2 | 21/95 [00:14<00:51, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9229, LAS: 0.8595, UEM: 0.5345, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9966, partial_loss/deprel_loss: 1.0144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1038, loss: 0.9269, batch_reg_loss: 0.0930, reg_loss: 0.0927 ||: 26%|##6 | 25/95 [00:16<00:47, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9235, LAS: 0.8599, UEM: 0.5237, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4287, 
partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.9253, batch_reg_loss: 0.0931, reg_loss: 0.0928 ||: 29%|##9 | 28/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9257, LAS: 0.8626, UEM: 0.5416, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1919, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.9015, batch_reg_loss: 0.0931, reg_loss: 0.0928 ||: 33%|###2 | 31/95 [00:21<00:44, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.9265, LAS: 0.8633, UEM: 0.5546, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1036, partial_loss/deprel_loss: 1.1616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2432, loss: 0.8961, batch_reg_loss: 0.0932, reg_loss: 0.0928 ||: 36%|###5 | 34/95 [00:23<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9280, LAS: 0.8649, UEM: 0.5659, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4681, partial_loss/deprel_loss: 0.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7734, loss: 0.8842, batch_reg_loss: 0.0933, reg_loss: 0.0929 ||: 39%|###8 | 37/95 [00:25<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9282, LAS: 0.8651, UEM: 0.5715, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2860, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5780, loss: 0.8838, batch_reg_loss: 0.0933, reg_loss: 0.0929 ||: 42%|####2 | 40/95 [00:27<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.9280, LAS: 0.8651, UEM: 0.5746, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6112, partial_loss/deprel_loss: 1.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4135, loss: 0.8834, batch_reg_loss: 0.0934, reg_loss: 0.0929 ||: 45%|####5 | 43/95 [00:30<00:40, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9286, LAS: 0.8656, UEM: 0.5680, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6863, partial_loss/deprel_loss: 0.8954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9471, loss: 0.8781, batch_reg_loss: 0.0935, reg_loss: 0.0930 ||: 48%|####8 | 46/95 [00:33<00:39, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9281, LAS: 0.8651, UEM: 0.5619, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2999, partial_loss/deprel_loss: 1.2194, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3291, loss: 0.8818, batch_reg_loss: 0.0935, reg_loss: 0.0930 ||: 52%|#####1 | 49/95 [00:35<00:35, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9284, LAS: 0.8654, UEM: 0.5685, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4109, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3804, loss: 0.8792, batch_reg_loss: 0.0936, reg_loss: 0.0930 ||: 55%|#####4 | 52/95 [00:39<00:39, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9290, LAS: 0.8665, UEM: 0.5837, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1328, 
partial_loss/deprel_loss: 0.2806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3447, loss: 0.8706, batch_reg_loss: 0.0937, reg_loss: 0.0931 ||: 58%|#####7 | 55/95 [00:41<00:35, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9294, LAS: 0.8665, UEM: 0.5767, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7648, partial_loss/deprel_loss: 0.9760, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0275, loss: 0.8704, batch_reg_loss: 0.0937, reg_loss: 0.0931 ||: 61%|######1 | 58/95 [00:43<00:31, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9308, LAS: 0.8682, UEM: 0.5835, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.5147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.8553, batch_reg_loss: 0.0938, reg_loss: 0.0931 ||: 64%|######4 | 61/95 [00:46<00:27, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9294, LAS: 0.8665, UEM: 0.5760, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8493, partial_loss/deprel_loss: 0.9959, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0604, loss: 0.8729, batch_reg_loss: 0.0939, reg_loss: 0.0932 ||: 68%|######8 | 65/95 [00:48<00:23, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9290, LAS: 0.8658, UEM: 0.5684, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4934, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7159, loss: 0.8777, batch_reg_loss: 0.0939, reg_loss: 0.0932 ||: 72%|#######1 | 68/95 [00:50<00:20, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9287, LAS: 0.8654, UEM: 0.5604, LEM: 0.3071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7519, partial_loss/deprel_loss: 0.8984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9631, loss: 0.8827, batch_reg_loss: 0.0940, reg_loss: 0.0932 ||: 75%|#######4 | 71/95 [00:52<00:17, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7866, UAS: 0.9278, LAS: 0.8644, UEM: 0.5533, LEM: 0.3016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6260, partial_loss/deprel_loss: 1.3245, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4789, loss: 0.8904, batch_reg_loss: 0.0941, reg_loss: 0.0933 ||: 78%|#######7 | 74/95 [00:55<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7768, UAS: 0.9264, LAS: 0.8628, UEM: 0.5454, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9205, partial_loss/deprel_loss: 1.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6140, loss: 0.9026, batch_reg_loss: 0.0941, reg_loss: 0.0933 ||: 81%|########1 | 77/95 [00:57<00:12, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8221, UAS: 0.9259, LAS: 0.8622, UEM: 0.5381, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2362, partial_loss/deprel_loss: 1.1283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2441, loss: 0.9077, batch_reg_loss: 0.0942, reg_loss: 0.0933 ||: 84%|########4 | 80/95 [00:59<00:10, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8262, UAS: 0.9257, LAS: 0.8619, UEM: 0.5395, LEM: 0.2932, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1983, partial_loss/deprel_loss: 1.1750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2739, loss: 0.9105, batch_reg_loss: 0.0943, reg_loss: 0.0934 ||: 87%|########7 | 83/95 [01:01<00:08, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8201, UAS: 0.9257, LAS: 0.8619, UEM: 0.5385, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0666, partial_loss/deprel_loss: 1.1067, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1930, loss: 0.9104, batch_reg_loss: 0.0944, reg_loss: 0.0934 ||: 91%|######### | 86/95 [01:03<00:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9265, LAS: 0.8628, UEM: 0.5374, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.5369, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5849, loss: 0.9043, batch_reg_loss: 0.0945, reg_loss: 0.0935 ||: 95%|#########4| 90/95 [01:06<00:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8174, UAS: 0.9268, LAS: 0.8631, UEM: 0.5373, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2839, partial_loss/deprel_loss: 1.1413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2644, loss: 0.9027, batch_reg_loss: 0.0946, reg_loss: 0.0935 ||: 99%|#########8| 94/95 [01:08<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8302, UAS: 0.9264, LAS: 0.8628, UEM: 0.5351, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2075, partial_loss/deprel_loss: 1.1032, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2186, loss: 0.9061, batch_reg_loss: 0.0946, reg_loss: 0.0935 ||: 
100%|##########| 95/95 [01:09<00:00, 1.37it/s]\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - reg_loss | 0.094 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - UEM | 0.535 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - LEM | 0.285 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EM | 0.830 | N/A\n", + "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.207 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - UAS | 0.926 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.103 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - loss | 0.906 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - LAS | 0.863 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:43,093 - INFO - combo.training.trainer - Epoch duration: 0:01:09.396964\n", + "2023-04-06 23:16:43,093 - INFO - combo.training.trainer - Estimated training time remaining: 7:04:48\n", + "2023-04-06 23:16:43,093 - INFO - allennlp.training.trainer - Epoch 24/399\n", + "2023-04-06 23:16:43,093 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:16:43,094 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:16:43,100 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9249, LAS: 0.8612, UEM: 0.3056, LEM: 0.0894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6457, partial_loss/deprel_loss: 0.7513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8249, loss: 0.9038, batch_reg_loss: 0.0947, reg_loss: 0.0946 ||: 4%|4 | 4/95 [00:02<00:56, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9331, LAS: 0.8720, UEM: 0.4283, LEM: 0.1824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2924, partial_loss/deprel_loss: 0.4524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5151, loss: 0.8246, batch_reg_loss: 0.0947, reg_loss: 0.0947 ||: 7%|7 | 7/95 [00:04<00:56, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9360, LAS: 0.8737, UEM: 0.4721, LEM: 0.2128, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4536, partial_loss/deprel_loss: 0.6589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.8078, batch_reg_loss: 0.0948, reg_loss: 0.0947 ||: 11%|# | 10/95 [00:07<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9323, LAS: 0.8695, UEM: 0.4776, LEM: 0.2093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3617, partial_loss/deprel_loss: 0.6263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6682, loss: 0.8369, batch_reg_loss: 0.0949, reg_loss: 0.0947 ||: 14%|#3 | 13/95 [00:09<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8336, UAS: 0.9316, LAS: 0.8699, UEM: 0.4900, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2622, partial_loss/deprel_loss: 1.1134, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2381, loss: 0.8428, batch_reg_loss: 0.0949, reg_loss: 0.0948 ||: 18%|#7 | 17/95 [00:11<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9322, LAS: 0.8705, UEM: 0.5049, LEM: 0.2429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.4451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.8404, batch_reg_loss: 0.0950, reg_loss: 0.0948 ||: 21%|##1 | 20/95 [00:13<00:51, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9301, LAS: 0.8684, UEM: 0.4812, LEM: 0.2256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.7618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8170, loss: 0.8559, batch_reg_loss: 0.0951, reg_loss: 0.0948 ||: 25%|##5 | 24/95 [00:16<00:46, 
1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9300, LAS: 0.8688, UEM: 0.5011, LEM: 0.2415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2828, partial_loss/deprel_loss: 0.4777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.8527, batch_reg_loss: 0.0952, reg_loss: 0.0949 ||: 28%|##8 | 27/95 [00:18<00:46, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9327, LAS: 0.8717, UEM: 0.5366, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6499, partial_loss/deprel_loss: 0.8602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9134, loss: 0.8289, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||: 33%|###2 | 31/95 [00:20<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9316, LAS: 0.8703, UEM: 0.5202, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8491, partial_loss/deprel_loss: 0.8918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 0.8418, batch_reg_loss: 0.0953, reg_loss: 0.0950 ||: 36%|###5 | 34/95 [00:22<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9334, LAS: 0.8725, UEM: 0.5423, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4035, partial_loss/deprel_loss: 0.6322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6819, loss: 0.8235, batch_reg_loss: 0.0954, reg_loss: 0.0950 ||: 39%|###8 | 37/95 [00:25<00:42, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8001, UAS: 0.9309, LAS: 0.8697, UEM: 0.5260, LEM: 
0.2675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4140, partial_loss/deprel_loss: 1.2018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3397, loss: 0.8425, batch_reg_loss: 0.0955, reg_loss: 0.0950 ||: 42%|####2 | 40/95 [00:27<00:40, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9311, LAS: 0.8699, UEM: 0.5406, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1469, partial_loss/deprel_loss: 0.3664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4180, loss: 0.8396, batch_reg_loss: 0.0955, reg_loss: 0.0951 ||: 45%|####5 | 43/95 [00:30<00:39, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9293, LAS: 0.8681, UEM: 0.5387, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2984, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6031, loss: 0.8573, batch_reg_loss: 0.0956, reg_loss: 0.0951 ||: 48%|####8 | 46/95 [00:32<00:36, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9308, LAS: 0.8700, UEM: 0.5586, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.6094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6677, loss: 0.8396, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||: 52%|#####1 | 49/95 [00:34<00:35, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9300, LAS: 0.8688, UEM: 0.5567, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0885, partial_loss/deprel_loss: 1.0907, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1860, loss: 0.8510, batch_reg_loss: 0.0957, reg_loss: 
0.0952 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8210, UAS: 0.9292, LAS: 0.8678, UEM: 0.5456, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2178, partial_loss/deprel_loss: 1.1537, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2623, loss: 0.8606, batch_reg_loss: 0.0958, reg_loss: 0.0952 ||: 59%|#####8 | 56/95 [00:39<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9287, LAS: 0.8669, UEM: 0.5385, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2499, partial_loss/deprel_loss: 1.1162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2388, loss: 0.8674, batch_reg_loss: 0.0959, reg_loss: 0.0952 ||: 63%|######3 | 60/95 [00:41<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9286, LAS: 0.8667, UEM: 0.5355, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2946, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5636, loss: 0.8687, batch_reg_loss: 0.0960, reg_loss: 0.0953 ||: 67%|######7 | 64/95 [00:43<00:19, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8406, UAS: 0.9291, LAS: 0.8674, UEM: 0.5448, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9763, partial_loss/deprel_loss: 0.9913, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8637, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||: 72%|#######1 | 68/95 [00:46<00:17, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9284, LAS: 0.8665, UEM: 0.5365, LEM: 0.2817, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3328, partial_loss/deprel_loss: 1.2516, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3640, loss: 0.8735, batch_reg_loss: 0.0962, reg_loss: 0.0954 ||: 76%|#######5 | 72/95 [00:48<00:14, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9294, LAS: 0.8672, UEM: 0.5403, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3011, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6034, loss: 0.8663, batch_reg_loss: 0.0963, reg_loss: 0.0954 ||: 81%|########1 | 77/95 [00:51<00:10, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9286, LAS: 0.8664, UEM: 0.5539, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1272, partial_loss/deprel_loss: 1.1322, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2275, loss: 0.8750, batch_reg_loss: 0.0964, reg_loss: 0.0955 ||: 85%|########5 | 81/95 [00:53<00:08, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7664, UAS: 0.9275, LAS: 0.8651, UEM: 0.5479, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1046, partial_loss/deprel_loss: 1.5443, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7528, loss: 0.8858, batch_reg_loss: 0.0965, reg_loss: 0.0955 ||: 89%|########9 | 85/95 [00:56<00:06, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8017, UAS: 0.9272, LAS: 0.8646, UEM: 0.5430, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4042, partial_loss/deprel_loss: 1.3009, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4182, loss: 0.8911, batch_reg_loss: 0.0966, reg_loss: 
0.0956 ||: 94%|#########3| 89/95 [00:59<00:03, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9267, LAS: 0.8640, UEM: 0.5401, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7409, partial_loss/deprel_loss: 0.8910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9577, loss: 0.8968, batch_reg_loss: 0.0967, reg_loss: 0.0956 ||: 98%|#########7| 93/95 [01:01<00:01, 1.56it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9270, LAS: 0.8644, UEM: 0.5390, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9299, loss: 0.8950, batch_reg_loss: 0.0967, reg_loss: 0.0956 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-06 23:17:46,366 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - reg_loss | 0.096 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UEM | 0.539 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - LEM | 0.289 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EM | 0.865 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.682 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UAS | 0.927 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.871 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - loss | 0.895 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - LAS | 0.864 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.trainer - Epoch duration: 0:01:03.275262\n", + "2023-04-06 23:17:46,368 - INFO - combo.training.trainer - Estimated training time remaining: 7:02:32\n", + "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - Epoch 25/399\n", + "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:17:46,375 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9189, LAS: 0.8572, UEM: 0.6852, LEM: 0.5232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1098, partial_loss/deprel_loss: 0.3017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.9374, batch_reg_loss: 0.0968, reg_loss: 0.0967 ||: 3%|3 | 3/95 [00:02<01:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8290, UAS: 0.9208, LAS: 0.8558, UEM: 0.5725, LEM: 0.3888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1098, partial_loss/deprel_loss: 1.1618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2482, loss: 0.9715, batch_reg_loss: 0.0969, reg_loss: 0.0968 ||: 7%|7 | 7/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9256, LAS: 0.8627, UEM: 0.5164, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 0.7931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8813, loss: 0.9090, batch_reg_loss: 0.0970, reg_loss: 0.0968 ||: 12%|#1 | 11/95 [00:07<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9256, LAS: 0.8639, UEM: 0.6032, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0652, partial_loss/deprel_loss: 0.1868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2595, loss: 0.9034, batch_reg_loss: 0.0970, reg_loss: 0.0969 ||: 15%|#4 | 14/95 [00:09<01:00, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9313, LAS: 0.8700, UEM: 0.6227, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3785, partial_loss/deprel_loss: 0.5911, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6457, loss: 0.8529, batch_reg_loss: 0.0971, reg_loss: 0.0969 ||: 18%|#7 | 17/95 [00:12<00:57, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9294, LAS: 0.8675, UEM: 0.5875, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4364, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8762, batch_reg_loss: 0.0972, reg_loss: 0.0970 ||: 22%|##2 | 21/95 [00:14<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9292, LAS: 0.8669, UEM: 0.5596, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.7809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8110, loss: 0.8809, batch_reg_loss: 0.0973, reg_loss: 0.0970 ||: 26%|##6 | 25/95 [00:17<00:48, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9298, LAS: 0.8674, UEM: 0.5522, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6590, partial_loss/deprel_loss: 0.8291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8925, loss: 0.8776, batch_reg_loss: 0.0974, reg_loss: 0.0970 ||: 29%|##9 | 28/95 [00:19<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.9299, LAS: 0.8680, UEM: 0.5456, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9874, partial_loss/deprel_loss: 1.0991, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1742, loss: 0.8726, batch_reg_loss: 0.0974, reg_loss: 0.0971 ||: 34%|###3 | 32/95 [00:21<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9290, LAS: 
0.8669, UEM: 0.5328, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7105, loss: 0.8782, batch_reg_loss: 0.0975, reg_loss: 0.0971 ||: 38%|###7 | 36/95 [00:24<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8141, UAS: 0.9284, LAS: 0.8662, UEM: 0.5361, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4523, partial_loss/deprel_loss: 1.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3896, loss: 0.8849, batch_reg_loss: 0.0976, reg_loss: 0.0972 ||: 41%|####1 | 39/95 [00:26<00:39, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7732, UAS: 0.9246, LAS: 0.8615, UEM: 0.5251, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9087, partial_loss/deprel_loss: 1.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6392, loss: 0.9204, batch_reg_loss: 0.0977, reg_loss: 0.0972 ||: 44%|####4 | 42/95 [00:29<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9254, LAS: 0.8623, UEM: 0.5276, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7164, loss: 0.9134, batch_reg_loss: 0.0977, reg_loss: 0.0972 ||: 47%|####7 | 45/95 [00:31<00:37, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9226, LAS: 0.8588, UEM: 0.5102, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8822, partial_loss/deprel_loss: 0.9684, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0490, loss: 0.9447, batch_reg_loss: 0.0978, reg_loss: 0.0973 ||: 52%|#####1 | 49/95 [00:34<00:32, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9239, LAS: 0.8604, UEM: 0.5140, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3090, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5426, loss: 0.9326, batch_reg_loss: 0.0979, reg_loss: 0.0973 ||: 56%|#####5 | 53/95 [00:36<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9247, LAS: 0.8612, UEM: 0.5259, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1767, partial_loss/deprel_loss: 0.3957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.9250, batch_reg_loss: 0.0980, reg_loss: 0.0974 ||: 60%|###### | 57/95 [00:39<00:25, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9248, LAS: 0.8615, UEM: 0.5254, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2928, partial_loss/deprel_loss: 0.5556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.9223, batch_reg_loss: 0.0981, reg_loss: 0.0974 ||: 64%|######4 | 61/95 [00:42<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7954, UAS: 0.9250, LAS: 0.8616, UEM: 0.5250, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6197, partial_loss/deprel_loss: 1.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4504, loss: 0.9219, batch_reg_loss: 0.0982, reg_loss: 0.0975 ||: 68%|######8 | 65/95 [00:44<00:20, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9256, LAS: 0.8623, UEM: 0.5224, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2762, partial_loss/deprel_loss: 0.5328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.9149, batch_reg_loss: 0.0983, reg_loss: 0.0975 ||: 73%|#######2 | 69/95 [00:47<00:17, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9260, LAS: 0.8628, UEM: 0.5265, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2881, partial_loss/deprel_loss: 0.4474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5140, loss: 0.9117, batch_reg_loss: 0.0984, reg_loss: 0.0976 ||: 77%|#######6 | 73/95 [00:49<00:14, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8064, UAS: 0.9260, LAS: 0.8628, UEM: 0.5274, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3724, partial_loss/deprel_loss: 1.1643, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3044, loss: 0.9094, batch_reg_loss: 0.0985, reg_loss: 0.0976 ||: 81%|########1 | 77/95 [00:52<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9267, LAS: 0.8637, UEM: 0.5316, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3660, partial_loss/deprel_loss: 0.5573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.9028, batch_reg_loss: 0.0985, reg_loss: 0.0976 ||: 84%|########4 | 80/95 [00:54<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9264, LAS: 0.8632, UEM: 0.5251, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5652, partial_loss/deprel_loss: 0.8186, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8665, loss: 0.9087, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||: 87%|########7 | 83/95 [00:57<00:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9272, LAS: 0.8641, UEM: 0.5284, LEM: 0.2816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5205, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7597, loss: 0.9006, batch_reg_loss: 0.0987, reg_loss: 0.0977 ||: 91%|######### | 86/95 [00:59<00:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9273, LAS: 0.8641, UEM: 0.5355, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4141, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6806, loss: 0.8981, batch_reg_loss: 0.0987, reg_loss: 0.0977 ||: 94%|#########3| 89/95 [01:01<00:04, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9277, LAS: 0.8647, UEM: 0.5379, LEM: 0.2892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5813, partial_loss/deprel_loss: 0.7569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8206, loss: 0.8927, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 97%|#########6| 92/95 [01:03<00:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9283, LAS: 0.8652, UEM: 0.5407, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8872, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 100%|##########| 95/95 [01:06<00:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9283, LAS: 0.8652, UEM: 0.5407, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8872, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 23:18:52,458 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9213, LAS: 0.8628, UEM: 0.3785, LEM: 0.1168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4790, partial_loss/deprel_loss: 23.3874, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8057, loss: 31.9415, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.07s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9251, LAS: 0.8630, UEM: 0.3372, LEM: 0.1015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8384, partial_loss/deprel_loss: 42.7479, partial_loss/cycle_loss: 0.0000, batch_loss: 34.3660, loss: 31.7453, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:06, 1.03s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9405, LAS: 0.8815, UEM: 0.5725, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4084, partial_loss/deprel_loss: 28.1948, partial_loss/cycle_loss: 0.0000, batch_loss: 22.6376, loss: 27.6476, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8732, UAS: 0.9460, LAS: 0.8885, UEM: 0.6523, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7674, partial_loss/deprel_loss: 32.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4835, loss: 25.6424, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9460, LAS: 0.8885, UEM: 0.6523, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7674, partial_loss/deprel_loss: 32.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4835, loss: 25.6424, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "2023-04-06 23:19:03,065 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - reg_loss | 0.098 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UEM | 0.541 | 0.652\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - LEM | 0.290 | 0.380\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EM | 0.876 | 0.873\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.555 | 0.767\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UAS | 
0.928 | 0.946\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.729 | 32.913\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - loss | 0.887 | 25.642\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - LAS | 0.865 | 0.888\n", + "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.trainer - Epoch duration: 0:01:16.698692\n", + "2023-04-06 23:19:03,067 - INFO - combo.training.trainer - Estimated training time remaining: 7:03:35\n", + "2023-04-06 23:19:03,067 - INFO - allennlp.training.trainer - Epoch 26/399\n", + "2023-04-06 23:19:03,068 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:19:03,068 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:19:03,074 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8072, UAS: 0.9113, LAS: 0.8445, UEM: 0.2432, LEM: 0.0822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4756, 
partial_loss/deprel_loss: 1.1600, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3220, loss: 1.0506, batch_reg_loss: 0.0989, reg_loss: 0.0989 ||: 3%|3 | 3/95 [00:02<01:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9313, LAS: 0.8702, UEM: 0.6215, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5793, loss: 0.8482, batch_reg_loss: 0.0990, reg_loss: 0.0989 ||: 6%|6 | 6/95 [00:04<01:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8316, UAS: 0.9333, LAS: 0.8707, UEM: 0.5914, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0801, partial_loss/deprel_loss: 1.0039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1181, loss: 0.8360, batch_reg_loss: 0.0990, reg_loss: 0.0989 ||: 9%|9 | 9/95 [00:06<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9310, LAS: 0.8692, UEM: 0.5342, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9169, partial_loss/deprel_loss: 0.8493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9619, loss: 0.8448, batch_reg_loss: 0.0991, reg_loss: 0.0990 ||: 14%|#3 | 13/95 [00:08<00:54, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9347, LAS: 0.8743, UEM: 0.6199, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0694, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2668, loss: 0.8110, batch_reg_loss: 0.0991, reg_loss: 0.0990 ||: 17%|#6 | 16/95 [00:11<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9389, LAS: 0.8791, UEM: 0.6526, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1531, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4165, loss: 0.7715, batch_reg_loss: 0.0992, reg_loss: 0.0990 ||: 20%|## | 19/95 [00:13<00:57, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8427, UAS: 0.9359, LAS: 0.8755, UEM: 0.6283, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0335, partial_loss/deprel_loss: 0.9413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0590, loss: 0.8061, batch_reg_loss: 0.0993, reg_loss: 0.0991 ||: 23%|##3 | 22/95 [00:15<00:55, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9358, LAS: 0.8751, UEM: 0.6096, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 0.8102, batch_reg_loss: 0.0993, reg_loss: 0.0991 ||: 27%|##7 | 26/95 [00:18<00:49, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9367, LAS: 0.8759, UEM: 0.5972, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4592, partial_loss/deprel_loss: 0.6983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7499, loss: 0.8017, batch_reg_loss: 0.0994, reg_loss: 0.0991 ||: 32%|###1 | 30/95 [00:20<00:43, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7727, UAS: 0.9329, LAS: 0.8714, UEM: 0.5814, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 2.0666, partial_loss/deprel_loss: 1.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7008, loss: 0.8388, batch_reg_loss: 0.0995, reg_loss: 0.0992 ||: 35%|###4 | 33/95 [00:22<00:42, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9321, LAS: 0.8707, UEM: 0.5792, LEM: 0.3314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5242, partial_loss/deprel_loss: 0.6863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7535, loss: 0.8426, batch_reg_loss: 0.0996, reg_loss: 0.0992 ||: 38%|###7 | 36/95 [00:25<00:41, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9335, LAS: 0.8721, UEM: 0.5865, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4779, loss: 0.8318, batch_reg_loss: 0.0996, reg_loss: 0.0992 ||: 41%|####1 | 39/95 [00:27<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9334, LAS: 0.8717, UEM: 0.5767, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7608, partial_loss/deprel_loss: 0.8941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9672, loss: 0.8360, batch_reg_loss: 0.0997, reg_loss: 0.0993 ||: 44%|####4 | 42/95 [00:29<00:37, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8195, UAS: 0.9308, LAS: 0.8689, UEM: 0.5553, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2714, partial_loss/deprel_loss: 1.1683, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2887, loss: 0.8602, batch_reg_loss: 0.0998, reg_loss: 0.0993 ||: 48%|####8 | 46/95 [00:31<00:32, 1.49it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9302, LAS: 0.8681, UEM: 0.5470, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9463, loss: 0.8662, batch_reg_loss: 0.0999, reg_loss: 0.0993 ||: 53%|#####2 | 50/95 [00:34<00:29, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9290, LAS: 0.8667, UEM: 0.5389, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3298, partial_loss/deprel_loss: 0.5372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5956, loss: 0.8754, batch_reg_loss: 0.1000, reg_loss: 0.0994 ||: 57%|#####6 | 54/95 [00:37<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9298, LAS: 0.8677, UEM: 0.5382, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.6646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7194, loss: 0.8674, batch_reg_loss: 0.1000, reg_loss: 0.0994 ||: 60%|###### | 57/95 [00:39<00:26, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9305, LAS: 0.8687, UEM: 0.5427, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.7491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8190, loss: 0.8575, batch_reg_loss: 0.1001, reg_loss: 0.0995 ||: 63%|######3 | 60/95 [00:41<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9314, LAS: 0.8696, UEM: 0.5507, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3255, partial_loss/deprel_loss: 0.5318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5907, loss: 0.8503, batch_reg_loss: 0.1002, reg_loss: 0.0995 ||: 66%|######6 | 63/95 [00:43<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9325, LAS: 0.8710, UEM: 0.5650, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.4833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5358, loss: 0.8399, batch_reg_loss: 0.1002, reg_loss: 0.0995 ||: 69%|######9 | 66/95 [00:45<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9321, LAS: 0.8707, UEM: 0.5562, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5490, partial_loss/deprel_loss: 0.6523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7320, loss: 0.8437, batch_reg_loss: 0.1003, reg_loss: 0.0996 ||: 74%|#######3 | 70/95 [00:48<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9299, LAS: 0.8679, UEM: 0.5506, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0729, partial_loss/deprel_loss: 1.0520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1566, loss: 0.8650, batch_reg_loss: 0.1004, reg_loss: 0.0996 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9310, LAS: 0.8692, UEM: 0.5607, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5735, loss: 0.8541, batch_reg_loss: 0.1005, reg_loss: 0.0996 ||: 81%|########1 | 77/95 [00:53<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9311, LAS: 0.8690, UEM: 0.5606, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3240, partial_loss/deprel_loss: 0.5033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.8555, batch_reg_loss: 0.1006, reg_loss: 0.0997 ||: 85%|########5 | 81/95 [00:55<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7720, UAS: 0.9296, LAS: 0.8672, UEM: 0.5546, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9315, partial_loss/deprel_loss: 1.4020, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6085, loss: 0.8708, batch_reg_loss: 0.1006, reg_loss: 0.0997 ||: 89%|########9 | 85/95 [00:58<00:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9295, LAS: 0.8671, UEM: 0.5508, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.5579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.8730, batch_reg_loss: 0.1007, reg_loss: 0.0998 ||: 94%|#########3| 89/95 [01:00<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8302, UAS: 0.9282, LAS: 0.8654, UEM: 0.5411, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2976, partial_loss/deprel_loss: 1.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2402, loss: 0.8888, batch_reg_loss: 0.1008, reg_loss: 0.0998 ||: 98%|#########7| 93/95 [01:03<00:01, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8521, UAS: 0.9284, LAS: 0.8657, UEM: 0.5413, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.7940, partial_loss/deprel_loss: 0.9193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9951, loss: 0.8863, batch_reg_loss: 0.1009, reg_loss: 0.0998 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - reg_loss | 0.100 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - UEM | 0.541 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - LEM | 0.288 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EM | 0.852 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.794 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - UAS | 0.928 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.919 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - loss | 0.886 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - LAS | 0.866 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 
2425.596 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,749 - INFO - combo.training.trainer - Epoch duration: 0:01:04.681370\n", + "2023-04-06 23:20:07,749 - INFO - combo.training.trainer - Estimated training time remaining: 7:01:42\n", + "2023-04-06 23:20:07,749 - INFO - allennlp.training.trainer - Epoch 27/399\n", + "2023-04-06 23:20:07,749 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:20:07,750 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:20:07,756 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9402, LAS: 0.8809, UEM: 0.6214, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0407, partial_loss/deprel_loss: 0.9975, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1071, loss: 0.7497, batch_reg_loss: 0.1009, reg_loss: 0.1009 ||: 3%|3 | 3/95 [00:02<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9328, LAS: 0.8730, UEM: 0.5754, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.5776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6473, loss: 0.8459, batch_reg_loss: 0.1010, reg_loss: 0.1010 ||: 
7%|7 | 7/95 [00:04<01:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9262, LAS: 0.8658, UEM: 0.5596, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2200, partial_loss/deprel_loss: 1.0964, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2222, loss: 0.9046, batch_reg_loss: 0.1011, reg_loss: 0.1010 ||: 12%|#1 | 11/95 [00:07<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9303, LAS: 0.8699, UEM: 0.5420, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2592, partial_loss/deprel_loss: 0.5424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.8664, batch_reg_loss: 0.1012, reg_loss: 0.1011 ||: 16%|#5 | 15/95 [00:09<00:52, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9321, LAS: 0.8715, UEM: 0.5462, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8517, batch_reg_loss: 0.1013, reg_loss: 0.1011 ||: 19%|#8 | 18/95 [00:11<00:51, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9278, LAS: 0.8668, UEM: 0.5127, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2996, partial_loss/deprel_loss: 1.0387, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1922, loss: 0.8887, batch_reg_loss: 0.1014, reg_loss: 0.1011 ||: 22%|##2 | 21/95 [00:13<00:50, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7923, UAS: 0.9247, LAS: 0.8633, UEM: 0.5101, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.7245, partial_loss/deprel_loss: 1.2478, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4445, loss: 0.9164, batch_reg_loss: 0.1014, reg_loss: 0.1012 ||: 25%|##5 | 24/95 [00:15<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9267, LAS: 0.8652, UEM: 0.5210, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8427, partial_loss/deprel_loss: 0.8735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9689, loss: 0.8957, batch_reg_loss: 0.1015, reg_loss: 0.1012 ||: 28%|##8 | 27/95 [00:18<00:49, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9258, LAS: 0.8646, UEM: 0.5120, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2659, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5554, loss: 0.8987, batch_reg_loss: 0.1016, reg_loss: 0.1012 ||: 33%|###2 | 31/95 [00:20<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9272, LAS: 0.8661, UEM: 0.5207, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7525, partial_loss/deprel_loss: 0.9462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0091, loss: 0.8831, batch_reg_loss: 0.1016, reg_loss: 0.1013 ||: 36%|###5 | 34/95 [00:23<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9275, LAS: 0.8662, UEM: 0.5229, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2010, partial_loss/deprel_loss: 0.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5064, loss: 0.8833, batch_reg_loss: 0.1017, reg_loss: 0.1013 ||: 40%|#### | 38/95 [00:25<00:40, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9298, LAS: 0.8686, UEM: 0.5593, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0536, partial_loss/deprel_loss: 0.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2817, loss: 0.8655, batch_reg_loss: 0.1018, reg_loss: 0.1014 ||: 44%|####4 | 42/95 [00:28<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9312, LAS: 0.8703, UEM: 0.5728, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6638, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9371, loss: 0.8541, batch_reg_loss: 0.1019, reg_loss: 0.1014 ||: 47%|####7 | 45/95 [00:30<00:35, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9325, LAS: 0.8718, UEM: 0.5748, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.5522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.8425, batch_reg_loss: 0.1020, reg_loss: 0.1014 ||: 52%|#####1 | 49/95 [00:33<00:32, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9324, LAS: 0.8714, UEM: 0.5740, LEM: 0.3170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.4914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5446, loss: 0.8439, batch_reg_loss: 0.1020, reg_loss: 0.1015 ||: 56%|#####5 | 53/95 [00:36<00:29, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9321, LAS: 0.8710, UEM: 0.5646, LEM: 0.3081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6406, partial_loss/deprel_loss: 0.6568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7557, loss: 0.8434, batch_reg_loss: 0.1021, reg_loss: 0.1015 ||: 59%|#####8 | 56/95 [00:38<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9334, LAS: 0.8726, UEM: 0.5752, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1631, partial_loss/deprel_loss: 0.3817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4401, loss: 0.8327, batch_reg_loss: 0.1022, reg_loss: 0.1015 ||: 62%|######2 | 59/95 [00:40<00:25, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8279, UAS: 0.9339, LAS: 0.8731, UEM: 0.5878, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3192, partial_loss/deprel_loss: 1.2217, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3434, loss: 0.8309, batch_reg_loss: 0.1022, reg_loss: 0.1016 ||: 65%|######5 | 62/95 [00:43<00:24, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9332, LAS: 0.8723, UEM: 0.5816, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.6110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.8382, batch_reg_loss: 0.1023, reg_loss: 0.1016 ||: 69%|######9 | 66/95 [00:45<00:20, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9321, LAS: 0.8710, UEM: 0.5712, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0679, partial_loss/deprel_loss: 1.0180, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1303, loss: 0.8474, batch_reg_loss: 0.1023, 
reg_loss: 0.1016 ||: 73%|#######2 | 69/95 [00:47<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9304, LAS: 0.8692, UEM: 0.5678, LEM: 0.3159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8930, partial_loss/deprel_loss: 0.9460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0378, loss: 0.8628, batch_reg_loss: 0.1024, reg_loss: 0.1017 ||: 76%|#######5 | 72/95 [00:49<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9309, LAS: 0.8698, UEM: 0.5655, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4401, partial_loss/deprel_loss: 0.6275, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8581, batch_reg_loss: 0.1025, reg_loss: 0.1017 ||: 80%|######## | 76/95 [00:52<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.9301, LAS: 0.8687, UEM: 0.5591, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2777, partial_loss/deprel_loss: 1.1437, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2731, loss: 0.8666, batch_reg_loss: 0.1026, reg_loss: 0.1017 ||: 83%|########3 | 79/95 [00:54<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8390, UAS: 0.9290, LAS: 0.8676, UEM: 0.5500, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0951, partial_loss/deprel_loss: 0.9973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1195, loss: 0.8737, batch_reg_loss: 0.1027, reg_loss: 0.1018 ||: 87%|########7 | 83/95 [00:57<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7900, UAS: 0.9282, LAS: 0.8667, UEM: 0.5473, 
LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7822, partial_loss/deprel_loss: 1.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4547, loss: 0.8816, batch_reg_loss: 0.1027, reg_loss: 0.1018 ||: 91%|######### | 86/95 [00:59<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9280, LAS: 0.8663, UEM: 0.5431, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9607, partial_loss/deprel_loss: 1.1209, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1917, loss: 0.8857, batch_reg_loss: 0.1028, reg_loss: 0.1019 ||: 94%|#########3| 89/95 [01:01<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9287, LAS: 0.8672, UEM: 0.5497, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5016, loss: 0.8794, batch_reg_loss: 0.1029, reg_loss: 0.1019 ||: 97%|#########6| 92/95 [01:03<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9292, LAS: 0.8676, UEM: 0.5475, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.8607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9217, loss: 0.8774, batch_reg_loss: 0.1030, reg_loss: 0.1019 ||: 100%|##########| 95/95 [01:06<00:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9292, LAS: 0.8676, UEM: 0.5475, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.8607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9217, loss: 0.8774, batch_reg_loss: 
0.1030, reg_loss: 0.1019 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - reg_loss | 0.102 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - UEM | 0.547 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - LEM | 0.295 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EM | 0.869 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.651 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.861 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - loss | 0.877 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - LAS | 0.868 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + 
"2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:13,790 - INFO - combo.training.trainer - Epoch duration: 0:01:06.040844\n", + "2023-04-06 23:21:13,790 - INFO - combo.training.trainer - Estimated training time remaining: 7:00:10\n", + "2023-04-06 23:21:13,790 - INFO - allennlp.training.trainer - Epoch 28/399\n", + "2023-04-06 23:21:13,790 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:21:13,791 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:21:13,797 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9346, LAS: 0.8735, UEM: 0.6326, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5411, loss: 0.8077, batch_reg_loss: 0.1030, reg_loss: 0.1030 ||: 3%|3 | 3/95 [00:02<01:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9287, LAS: 0.8674, UEM: 0.5346, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6960, partial_loss/deprel_loss: 0.7365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8315, loss: 0.8417, batch_reg_loss: 0.1031, reg_loss: 0.1030 ||: 6%|6 | 6/95 [00:04<01:06, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9345, LAS: 0.8759, UEM: 0.5972, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2194, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.7925, batch_reg_loss: 0.1032, reg_loss: 0.1031 ||: 9%|9 | 9/95 [00:06<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9365, LAS: 0.8772, UEM: 0.5851, LEM: 0.3187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8063, partial_loss/deprel_loss: 0.9712, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0415, loss: 0.7803, batch_reg_loss: 0.1033, reg_loss: 0.1031 ||: 13%|#2 | 12/95 [00:08<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.9352, LAS: 0.8757, UEM: 0.5425, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7990, partial_loss/deprel_loss: 0.8716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9604, loss: 0.8003, batch_reg_loss: 0.1033, reg_loss: 0.1032 ||: 17%|#6 | 16/95 [00:11<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9375, LAS: 0.8778, UEM: 0.5466, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.6074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7860, batch_reg_loss: 0.1034, reg_loss: 0.1032 ||: 21%|##1 | 20/95 [00:13<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9379, LAS: 0.8783, UEM: 0.5463, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5882, partial_loss/deprel_loss: 0.7416, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.8144, loss: 0.7834, batch_reg_loss: 0.1035, reg_loss: 0.1032 ||: 24%|##4 | 23/95 [00:15<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8387, UAS: 0.9334, LAS: 0.8734, UEM: 0.5331, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1025, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1597, loss: 0.8237, batch_reg_loss: 0.1036, reg_loss: 0.1033 ||: 27%|##7 | 26/95 [00:18<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9375, LAS: 0.8775, UEM: 0.5796, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4481, loss: 0.7905, batch_reg_loss: 0.1036, reg_loss: 0.1033 ||: 32%|###1 | 30/95 [00:20<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9390, LAS: 0.8796, UEM: 0.5881, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3049, partial_loss/deprel_loss: 0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.7753, batch_reg_loss: 0.1037, reg_loss: 0.1034 ||: 36%|###5 | 34/95 [00:23<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9383, LAS: 0.8791, UEM: 0.5771, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4137, partial_loss/deprel_loss: 0.5516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6278, loss: 0.7768, batch_reg_loss: 0.1038, reg_loss: 0.1034 ||: 39%|###8 | 37/95 [00:25<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9340, LAS: 
0.8743, UEM: 0.5647, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5219, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8181, batch_reg_loss: 0.1038, reg_loss: 0.1034 ||: 42%|####2 | 40/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9351, LAS: 0.8755, UEM: 0.5681, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3436, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6062, loss: 0.8089, batch_reg_loss: 0.1039, reg_loss: 0.1035 ||: 45%|####5 | 43/95 [00:30<00:38, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9339, LAS: 0.8741, UEM: 0.5594, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3736, partial_loss/deprel_loss: 0.6634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8196, batch_reg_loss: 0.1040, reg_loss: 0.1035 ||: 49%|####9 | 47/95 [00:32<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9337, LAS: 0.8738, UEM: 0.5603, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2939, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5702, loss: 0.8231, batch_reg_loss: 0.1040, reg_loss: 0.1035 ||: 53%|#####2 | 50/95 [00:34<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9327, LAS: 0.8726, UEM: 0.5652, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9954, partial_loss/deprel_loss: 1.1214, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2003, loss: 0.8335, 
batch_reg_loss: 0.1041, reg_loss: 0.1036 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9328, LAS: 0.8727, UEM: 0.5670, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4666, loss: 0.8345, batch_reg_loss: 0.1042, reg_loss: 0.1036 ||: 59%|#####8 | 56/95 [00:39<00:27, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9334, LAS: 0.8734, UEM: 0.5847, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7031, partial_loss/deprel_loss: 0.9869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0344, loss: 0.8302, batch_reg_loss: 0.1042, reg_loss: 0.1036 ||: 62%|######2 | 59/95 [00:41<00:25, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9340, LAS: 0.8741, UEM: 0.5861, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2656, partial_loss/deprel_loss: 0.4323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5032, loss: 0.8227, batch_reg_loss: 0.1043, reg_loss: 0.1037 ||: 65%|######5 | 62/95 [00:43<00:23, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9343, LAS: 0.8742, UEM: 0.5832, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2923, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5804, loss: 0.8244, batch_reg_loss: 0.1044, reg_loss: 0.1037 ||: 69%|######9 | 66/95 [00:45<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8361, UAS: 0.9334, LAS: 0.8731, 
UEM: 0.5736, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0562, partial_loss/deprel_loss: 1.0607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1642, loss: 0.8343, batch_reg_loss: 0.1045, reg_loss: 0.1037 ||: 73%|#######2 | 69/95 [00:48<00:17, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9317, LAS: 0.8714, UEM: 0.5647, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4167, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.8474, batch_reg_loss: 0.1046, reg_loss: 0.1038 ||: 77%|#######6 | 73/95 [00:50<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8362, UAS: 0.9317, LAS: 0.8713, UEM: 0.5695, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0380, partial_loss/deprel_loss: 1.0594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1598, loss: 0.8477, batch_reg_loss: 0.1046, reg_loss: 0.1038 ||: 81%|########1 | 77/95 [00:53<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9315, LAS: 0.8710, UEM: 0.5662, LEM: 0.3139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.7805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8638, loss: 0.8493, batch_reg_loss: 0.1047, reg_loss: 0.1039 ||: 85%|########5 | 81/95 [00:55<00:09, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9312, LAS: 0.8707, UEM: 0.5638, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6924, partial_loss/deprel_loss: 0.8298, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.9072, loss: 0.8523, batch_reg_loss: 0.1048, reg_loss: 0.1039 ||: 89%|########9 | 85/95 [00:58<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9315, LAS: 0.8709, UEM: 0.5598, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.6310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.8520, batch_reg_loss: 0.1049, reg_loss: 0.1039 ||: 93%|#########2| 88/95 [01:00<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9302, LAS: 0.8695, UEM: 0.5517, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0410, partial_loss/deprel_loss: 0.9326, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0593, loss: 0.8626, batch_reg_loss: 0.1050, reg_loss: 0.1040 ||: 97%|#########6| 92/95 [01:03<00:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9294, LAS: 0.8688, UEM: 0.5463, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7954, partial_loss/deprel_loss: 0.8031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9066, loss: 0.8690, batch_reg_loss: 0.1050, reg_loss: 0.1040 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - reg_loss | 0.104 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 
23:22:18,868 - INFO - combo.training.tensorboard_writer - UEM | 0.546 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - LEM | 0.299 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EM | 0.861 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.795 | N/A\n", + "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.803 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - loss | 0.869 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - LAS | 0.869 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:18,870 - INFO - combo.training.trainer - Epoch duration: 0:01:05.079751\n", + "2023-04-06 23:22:18,870 - INFO - combo.training.trainer - Estimated training time remaining: 
6:58:28\n", + "2023-04-06 23:22:18,870 - INFO - allennlp.training.trainer - Epoch 29/399\n", + "2023-04-06 23:22:18,870 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:22:18,871 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:22:18,878 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9405, LAS: 0.8823, UEM: 0.5759, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.8253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8819, loss: 0.7942, batch_reg_loss: 0.1051, reg_loss: 0.1051 ||: 4%|4 | 4/95 [00:02<00:55, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9405, LAS: 0.8816, UEM: 0.5821, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9805, partial_loss/deprel_loss: 0.9054, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0257, loss: 0.7758, batch_reg_loss: 0.1052, reg_loss: 0.1051 ||: 7%|7 | 7/95 [00:04<00:58, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9302, LAS: 0.8717, UEM: 0.5302, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6033, loss: 0.8529, batch_reg_loss: 0.1053, reg_loss: 0.1052 ||: 12%|#1 | 11/95 [00:07<00:54, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9260, LAS: 0.8661, UEM: 0.5289, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5726, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6318, loss: 0.8873, batch_reg_loss: 0.1053, reg_loss: 0.1052 ||: 15%|#4 | 14/95 [00:09<00:55, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9275, LAS: 0.8671, UEM: 0.5159, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0340, partial_loss/deprel_loss: 0.9651, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0843, loss: 0.8791, batch_reg_loss: 0.1054, reg_loss: 0.1053 ||: 19%|#8 | 18/95 [00:12<00:51, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9315, LAS: 0.8715, UEM: 0.5550, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2981, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.8402, batch_reg_loss: 0.1055, reg_loss: 0.1053 ||: 22%|##2 | 21/95 [00:14<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9280, LAS: 0.8674, UEM: 0.5284, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6160, partial_loss/deprel_loss: 0.7219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8063, loss: 0.8731, batch_reg_loss: 0.1056, reg_loss: 0.1053 ||: 25%|##5 | 24/95 [00:16<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9277, LAS: 0.8663, UEM: 0.4999, LEM: 0.2436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5052, partial_loss/deprel_loss: 0.7323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7925, loss: 0.8844, batch_reg_loss: 0.1057, reg_loss: 0.1054 ||: 29%|##9 | 28/95 [00:18<00:44, 1.51it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9291, LAS: 0.8684, UEM: 0.5310, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.7332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8018, loss: 0.8681, batch_reg_loss: 0.1057, reg_loss: 0.1054 ||: 33%|###2 | 31/95 [00:20<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9309, LAS: 0.8711, UEM: 0.5795, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0689, partial_loss/deprel_loss: 0.9747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0993, loss: 0.8510, batch_reg_loss: 0.1058, reg_loss: 0.1054 ||: 36%|###5 | 34/95 [00:23<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9288, LAS: 0.8687, UEM: 0.5669, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9300, partial_loss/deprel_loss: 0.9667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0652, loss: 0.8740, batch_reg_loss: 0.1059, reg_loss: 0.1055 ||: 39%|###8 | 37/95 [00:25<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9303, LAS: 0.8708, UEM: 0.5728, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.4225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4842, loss: 0.8581, batch_reg_loss: 0.1059, reg_loss: 0.1055 ||: 42%|####2 | 40/95 [00:27<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9324, LAS: 0.8733, UEM: 0.5812, LEM: 0.3390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3429, 
partial_loss/deprel_loss: 0.5983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6532, loss: 0.8376, batch_reg_loss: 0.1060, reg_loss: 0.1055 ||: 46%|####6 | 44/95 [00:30<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9312, LAS: 0.8722, UEM: 0.5699, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4785, partial_loss/deprel_loss: 0.6576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7279, loss: 0.8446, batch_reg_loss: 0.1061, reg_loss: 0.1056 ||: 51%|##### | 48/95 [00:33<00:33, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9314, LAS: 0.8722, UEM: 0.5611, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.7489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8229, loss: 0.8442, batch_reg_loss: 0.1062, reg_loss: 0.1056 ||: 54%|#####3 | 51/95 [00:35<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9304, LAS: 0.8710, UEM: 0.5544, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3823, partial_loss/deprel_loss: 1.1230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2811, loss: 0.8544, batch_reg_loss: 0.1062, reg_loss: 0.1056 ||: 57%|#####6 | 54/95 [00:37<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9306, LAS: 0.8711, UEM: 0.5548, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2805, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.8514, batch_reg_loss: 0.1063, reg_loss: 0.1057 ||: 60%|###### | 57/95 [00:39<00:27, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9310, LAS: 0.8713, UEM: 0.5602, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3802, partial_loss/deprel_loss: 0.6500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7024, loss: 0.8500, batch_reg_loss: 0.1063, reg_loss: 0.1057 ||: 63%|######3 | 60/95 [00:41<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8057, UAS: 0.9302, LAS: 0.8704, UEM: 0.5490, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6765, partial_loss/deprel_loss: 1.2324, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4277, loss: 0.8589, batch_reg_loss: 0.1064, reg_loss: 0.1058 ||: 67%|######7 | 64/95 [00:44<00:20, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9303, LAS: 0.8706, UEM: 0.5485, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5443, partial_loss/deprel_loss: 0.6740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 0.8559, batch_reg_loss: 0.1065, reg_loss: 0.1058 ||: 71%|####### | 67/95 [00:46<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9307, LAS: 0.8712, UEM: 0.5517, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5476, partial_loss/deprel_loss: 0.7697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8318, loss: 0.8514, batch_reg_loss: 0.1066, reg_loss: 0.1058 ||: 74%|#######3 | 70/95 [00:48<00:17, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9311, LAS: 0.8715, UEM: 0.5508, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4542, 
partial_loss/deprel_loss: 0.5922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6712, loss: 0.8487, batch_reg_loss: 0.1066, reg_loss: 0.1059 ||: 77%|#######6 | 73/95 [00:51<00:16, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9302, LAS: 0.8703, UEM: 0.5410, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5016, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7189, loss: 0.8583, batch_reg_loss: 0.1067, reg_loss: 0.1059 ||: 81%|########1 | 77/95 [00:53<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9304, LAS: 0.8706, UEM: 0.5378, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7016, partial_loss/deprel_loss: 0.8249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9071, loss: 0.8573, batch_reg_loss: 0.1068, reg_loss: 0.1059 ||: 84%|########4 | 80/95 [00:55<00:10, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9299, LAS: 0.8699, UEM: 0.5320, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6495, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8828, loss: 0.8622, batch_reg_loss: 0.1068, reg_loss: 0.1060 ||: 87%|########7 | 83/95 [00:57<00:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9300, LAS: 0.8701, UEM: 0.5276, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.5973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6527, loss: 0.8619, batch_reg_loss: 0.1069, reg_loss: 0.1060 ||: 
92%|#########1| 87/95 [01:00<00:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9301, LAS: 0.8702, UEM: 0.5347, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4250, loss: 0.8602, batch_reg_loss: 0.1070, reg_loss: 0.1060 ||: 95%|#########4| 90/95 [01:03<00:03, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9307, LAS: 0.8709, UEM: 0.5418, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6193, partial_loss/deprel_loss: 0.8146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8826, loss: 0.8549, batch_reg_loss: 0.1071, reg_loss: 0.1061 ||: 98%|#########7| 93/95 [01:05<00:01, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9309, LAS: 0.8709, UEM: 0.5424, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2886, partial_loss/deprel_loss: 0.5511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.8538, batch_reg_loss: 0.1071, reg_loss: 0.1061 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - reg_loss | 0.106 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UEM | 0.542 | N/A\n", + "2023-04-06 23:23:25,678 - INFO 
- combo.training.tensorboard_writer - LEM | 0.296 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EM | 0.893 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.289 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UAS | 0.931 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.551 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - loss | 0.854 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - LAS | 0.871 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:23:25,680 - INFO - combo.training.trainer - Epoch duration: 0:01:06.809689\n", + "2023-04-06 23:23:25,680 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:10\n", + "2023-04-06 23:23:25,680 - INFO - allennlp.training.trainer - Epoch 30/399\n", + "2023-04-06 23:23:25,680 
- INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:23:25,680 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:23:25,687 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9485, LAS: 0.8883, UEM: 0.6172, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2032, partial_loss/deprel_loss: 0.4108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4765, loss: 0.6787, batch_reg_loss: 0.1072, reg_loss: 0.1071 ||: 3%|3 | 3/95 [00:02<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8077, UAS: 0.9325, LAS: 0.8739, UEM: 0.5788, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4854, partial_loss/deprel_loss: 1.1183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2989, loss: 0.8021, batch_reg_loss: 0.1072, reg_loss: 0.1072 ||: 6%|6 | 6/95 [00:04<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9219, LAS: 0.8624, UEM: 0.5396, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0344, partial_loss/deprel_loss: 1.3158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5668, loss: 0.8970, batch_reg_loss: 0.1073, reg_loss: 0.1072 ||: 11%|# | 10/95 [00:06<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8236, UAS: 0.9129, LAS: 0.8517, UEM: 0.4775, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1380, partial_loss/deprel_loss: 1.0848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2028, loss: 0.9815, batch_reg_loss: 0.1074, reg_loss: 0.1072 ||: 14%|#3 | 13/95 
[00:09<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9162, LAS: 0.8554, UEM: 0.4791, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9552, partial_loss/deprel_loss: 0.8739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9976, loss: 0.9576, batch_reg_loss: 0.1074, reg_loss: 0.1073 ||: 17%|#6 | 16/95 [00:11<00:58, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9234, LAS: 0.8629, UEM: 0.5195, LEM: 0.2770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3310, partial_loss/deprel_loss: 0.5365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6029, loss: 0.9025, batch_reg_loss: 0.1075, reg_loss: 0.1073 ||: 21%|##1 | 20/95 [00:14<00:55, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9275, LAS: 0.8668, UEM: 0.5569, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1406, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4202, loss: 0.8713, batch_reg_loss: 0.1076, reg_loss: 0.1073 ||: 24%|##4 | 23/95 [00:16<00:52, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9298, LAS: 0.8694, UEM: 0.5545, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.5630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6095, loss: 0.8538, batch_reg_loss: 0.1077, reg_loss: 0.1074 ||: 27%|##7 | 26/95 [00:18<00:49, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9318, LAS: 0.8718, UEM: 
0.5587, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4433, partial_loss/deprel_loss: 0.6041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.8347, batch_reg_loss: 0.1077, reg_loss: 0.1074 ||: 32%|###1 | 30/95 [00:21<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9319, LAS: 0.8721, UEM: 0.5770, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7107, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8727, loss: 0.8302, batch_reg_loss: 0.1078, reg_loss: 0.1075 ||: 35%|###4 | 33/95 [00:23<00:44, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9326, LAS: 0.8732, UEM: 0.5866, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3633, partial_loss/deprel_loss: 0.5928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6547, loss: 0.8227, batch_reg_loss: 0.1079, reg_loss: 0.1075 ||: 38%|###7 | 36/95 [00:26<00:44, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9322, LAS: 0.8728, UEM: 0.5688, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.6978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7724, loss: 0.8291, batch_reg_loss: 0.1079, reg_loss: 0.1075 ||: 42%|####2 | 40/95 [00:28<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9310, LAS: 0.8717, UEM: 0.5667, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2758, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.8379, batch_reg_loss: 0.1080, 
reg_loss: 0.1076 ||: 45%|####5 | 43/95 [00:31<00:38, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9312, LAS: 0.8718, UEM: 0.5623, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.8358, batch_reg_loss: 0.1080, reg_loss: 0.1076 ||: 48%|####8 | 46/95 [00:33<00:35, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9322, LAS: 0.8732, UEM: 0.5874, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 0.6406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7188, loss: 0.8241, batch_reg_loss: 0.1081, reg_loss: 0.1076 ||: 52%|#####1 | 49/95 [00:35<00:36, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9321, LAS: 0.8729, UEM: 0.5790, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6182, partial_loss/deprel_loss: 0.7551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8359, loss: 0.8273, batch_reg_loss: 0.1082, reg_loss: 0.1077 ||: 56%|#####5 | 53/95 [00:38<00:30, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9317, LAS: 0.8724, UEM: 0.5672, LEM: 0.3272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8537, loss: 0.8331, batch_reg_loss: 0.1083, reg_loss: 0.1077 ||: 60%|###### | 57/95 [00:40<00:26, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9317, LAS: 0.8721, UEM: 0.5641, LEM: 0.3220, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5027, partial_loss/deprel_loss: 0.6883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.8379, batch_reg_loss: 0.1084, reg_loss: 0.1077 ||: 64%|######4 | 61/95 [00:43<00:22, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9305, LAS: 0.8704, UEM: 0.5515, LEM: 0.3111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6451, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9549, loss: 0.8522, batch_reg_loss: 0.1084, reg_loss: 0.1078 ||: 68%|######8 | 65/95 [00:45<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9315, LAS: 0.8714, UEM: 0.5530, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.5400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5980, loss: 0.8460, batch_reg_loss: 0.1085, reg_loss: 0.1078 ||: 73%|#######2 | 69/95 [00:48<00:17, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9325, LAS: 0.8724, UEM: 0.5549, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.5391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5974, loss: 0.8382, batch_reg_loss: 0.1086, reg_loss: 0.1079 ||: 77%|#######6 | 73/95 [00:51<00:14, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9322, LAS: 0.8720, UEM: 0.5487, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6038, partial_loss/deprel_loss: 0.7871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8591, loss: 0.8423, batch_reg_loss: 0.1087, reg_loss: 
0.1079 ||: 81%|########1 | 77/95 [00:53<00:11, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8324, UAS: 0.9292, LAS: 0.8688, UEM: 0.5399, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3246, partial_loss/deprel_loss: 0.9912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1667, loss: 0.8666, batch_reg_loss: 0.1088, reg_loss: 0.1080 ||: 85%|########5 | 81/95 [00:56<00:08, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9303, LAS: 0.8701, UEM: 0.5412, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4508, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7081, loss: 0.8578, batch_reg_loss: 0.1089, reg_loss: 0.1080 ||: 89%|########9 | 85/95 [00:58<00:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9302, LAS: 0.8701, UEM: 0.5400, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1560, partial_loss/deprel_loss: 1.0515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1814, loss: 0.8587, batch_reg_loss: 0.1090, reg_loss: 0.1080 ||: 94%|#########3| 89/95 [01:01<00:03, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.9308, LAS: 0.8708, UEM: 0.5543, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3766, partial_loss/deprel_loss: 1.1223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2822, loss: 0.8519, batch_reg_loss: 0.1091, reg_loss: 0.1081 ||: 98%|#########7| 93/95 [01:04<00:01, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9304, LAS: 0.8703, UEM: 0.5497, LEM: 0.2994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0909, partial_loss/deprel_loss: 1.0622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1771, loss: 0.8557, batch_reg_loss: 0.1091, reg_loss: 0.1081 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-06 23:24:31,061 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9493, LAS: 0.8889, UEM: 0.5691, LEM: 0.1780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4038, partial_loss/deprel_loss: 28.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 22.5808, loss: 22.6030, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:06, 1.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9441, LAS: 0.8850, UEM: 0.5694, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2868, partial_loss/deprel_loss: 27.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 21.9448, loss: 27.0188, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9383, LAS: 0.8790, UEM: 0.4910, LEM: 0.1820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 42.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 34.4852, loss: 28.7889, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9470, LAS: 0.8918, UEM: 0.6641, LEM: 0.3843, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 22.0492, partial_loss/cycle_loss: 0.0000, batch_loss: 17.6823, loss: 25.6736, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9470, LAS: 0.8918, UEM: 0.6641, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 22.0492, partial_loss/cycle_loss: 0.0000, batch_loss: 17.6823, loss: 25.6736, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "2023-04-06 23:24:41,625 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - reg_loss | 0.108 | 0.000\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - UEM | 0.550 | 0.664\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - LEM | 0.299 | 0.384\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EM | 0.832 | 0.927\n", + "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.091 | 0.214\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | 0.947\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.062 | 22.049\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - loss | 0.856 | 25.674\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - LAS | 0.870 | 0.892\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:41,628 - INFO - combo.training.trainer - Epoch duration: 0:01:15.948043\n", + "2023-04-06 23:24:41,628 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:41\n", + "2023-04-06 23:24:41,628 - INFO - allennlp.training.trainer - Epoch 31/399\n", + "2023-04-06 23:24:41,628 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:24:41,629 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:24:41,636 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9554, LAS: 0.8921, UEM: 0.6602, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3671, partial_loss/deprel_loss: 0.6465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 0.6303, 
batch_reg_loss: 0.1092, reg_loss: 0.1091 ||: 3%|3 | 3/95 [00:02<01:12, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9520, LAS: 0.8914, UEM: 0.6391, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4923, partial_loss/deprel_loss: 0.7018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7691, loss: 0.6716, batch_reg_loss: 0.1092, reg_loss: 0.1092 ||: 7%|7 | 7/95 [00:05<01:06, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9453, LAS: 0.8853, UEM: 0.5792, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7182, partial_loss/deprel_loss: 0.7852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8811, loss: 0.7250, batch_reg_loss: 0.1093, reg_loss: 0.1092 ||: 12%|#1 | 11/95 [00:07<00:59, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9388, LAS: 0.8788, UEM: 0.5190, LEM: 0.2554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9456, partial_loss/deprel_loss: 0.8558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9832, loss: 0.7850, batch_reg_loss: 0.1094, reg_loss: 0.1093 ||: 16%|#5 | 15/95 [00:10<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9360, LAS: 0.8756, UEM: 0.5046, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5136, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.8117, batch_reg_loss: 0.1095, reg_loss: 0.1093 ||: 20%|## | 19/95 [00:12<00:51, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8336, UAS: 0.9332, LAS: 0.8718, UEM: 0.4720, LEM: 0.2205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1145, partial_loss/deprel_loss: 1.1053, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2167, loss: 0.8445, batch_reg_loss: 0.1096, reg_loss: 0.1094 ||: 24%|##4 | 23/95 [00:15<00:46, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9323, LAS: 0.8711, UEM: 0.4599, LEM: 0.2114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.5635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6431, loss: 0.8527, batch_reg_loss: 0.1097, reg_loss: 0.1094 ||: 27%|##7 | 26/95 [00:17<00:45, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8258, UAS: 0.9323, LAS: 0.8707, UEM: 0.4526, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2397, partial_loss/deprel_loss: 1.0853, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2260, loss: 0.8561, batch_reg_loss: 0.1098, reg_loss: 0.1094 ||: 32%|###1 | 30/95 [00:19<00:43, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9332, LAS: 0.8717, UEM: 0.4648, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5229, partial_loss/deprel_loss: 0.7206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7909, loss: 0.8484, batch_reg_loss: 0.1098, reg_loss: 0.1095 ||: 35%|###4 | 33/95 [00:21<00:41, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9322, LAS: 0.8707, UEM: 0.4506, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4654, partial_loss/deprel_loss: 0.6659, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.7357, loss: 0.8623, batch_reg_loss: 0.1099, reg_loss: 0.1095 ||: 39%|###8 | 37/95 [00:24<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9307, LAS: 0.8692, UEM: 0.4356, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8833, loss: 0.8725, batch_reg_loss: 0.1100, reg_loss: 0.1095 ||: 42%|####2 | 40/95 [00:26<00:37, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9296, LAS: 0.8678, UEM: 0.4272, LEM: 0.1879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5058, partial_loss/deprel_loss: 0.7003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.8843, batch_reg_loss: 0.1101, reg_loss: 0.1096 ||: 45%|####5 | 43/95 [00:28<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9295, LAS: 0.8681, UEM: 0.4315, LEM: 0.1898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2709, partial_loss/deprel_loss: 1.0338, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1913, loss: 0.8818, batch_reg_loss: 0.1101, reg_loss: 0.1096 ||: 48%|####8 | 46/95 [00:31<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8474, UAS: 0.9283, LAS: 0.8667, UEM: 0.4210, LEM: 0.1832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8996, partial_loss/deprel_loss: 0.9643, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0616, loss: 0.8929, batch_reg_loss: 0.1102, reg_loss: 0.1096 ||: 52%|#####1 | 49/95 [00:33<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9301, 
LAS: 0.8692, UEM: 0.4763, LEM: 0.2466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4993, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8411, loss: 0.8742, batch_reg_loss: 0.1103, reg_loss: 0.1097 ||: 55%|#####4 | 52/95 [00:35<00:32, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8096, UAS: 0.9290, LAS: 0.8679, UEM: 0.4825, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5268, partial_loss/deprel_loss: 1.2334, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4024, loss: 0.8846, batch_reg_loss: 0.1103, reg_loss: 0.1097 ||: 58%|#####7 | 55/95 [00:37<00:29, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9300, LAS: 0.8691, UEM: 0.4876, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3654, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.8741, batch_reg_loss: 0.1104, reg_loss: 0.1098 ||: 62%|######2 | 59/95 [00:40<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9287, LAS: 0.8678, UEM: 0.4850, LEM: 0.2498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3838, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.8828, batch_reg_loss: 0.1105, reg_loss: 0.1098 ||: 65%|######5 | 62/95 [00:42<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9287, LAS: 0.8679, UEM: 0.4826, LEM: 0.2463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2953, partial_loss/deprel_loss: 0.4981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5681, loss: 0.8820, 
batch_reg_loss: 0.1106, reg_loss: 0.1098 ||: 69%|######9 | 66/95 [00:45<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9300, LAS: 0.8695, UEM: 0.5009, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.4462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5186, loss: 0.8702, batch_reg_loss: 0.1107, reg_loss: 0.1099 ||: 73%|#######2 | 69/95 [00:47<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9294, LAS: 0.8688, UEM: 0.5009, LEM: 0.2610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6164, partial_loss/deprel_loss: 0.7282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8166, loss: 0.8738, batch_reg_loss: 0.1107, reg_loss: 0.1099 ||: 77%|#######6 | 73/95 [00:49<00:14, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9307, LAS: 0.8707, UEM: 0.5151, LEM: 0.2706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.4397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5286, loss: 0.8588, batch_reg_loss: 0.1108, reg_loss: 0.1100 ||: 81%|########1 | 77/95 [00:52<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9316, LAS: 0.8717, UEM: 0.5285, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.8500, batch_reg_loss: 0.1109, reg_loss: 0.1100 ||: 84%|########4 | 80/95 [00:54<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8129, UAS: 0.9313, LAS: 
0.8716, UEM: 0.5363, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3228, partial_loss/deprel_loss: 1.0582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2221, loss: 0.8503, batch_reg_loss: 0.1110, reg_loss: 0.1100 ||: 88%|########8 | 84/95 [00:57<00:07, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9315, LAS: 0.8718, UEM: 0.5368, LEM: 0.2930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2220, partial_loss/deprel_loss: 1.0879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2257, loss: 0.8498, batch_reg_loss: 0.1110, reg_loss: 0.1101 ||: 93%|#########2| 88/95 [00:59<00:04, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9328, LAS: 0.8732, UEM: 0.5466, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6342, loss: 0.8388, batch_reg_loss: 0.1111, reg_loss: 0.1101 ||: 97%|#########6| 92/95 [01:02<00:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9323, LAS: 0.8726, UEM: 0.5503, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1446, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4271, loss: 0.8418, batch_reg_loss: 0.1112, reg_loss: 0.1102 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - 
reg_loss | 0.110 | N/A\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - UEM | 0.550 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LEM | 0.303 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - EM | 0.921 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.145 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.359 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - loss | 0.842 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LAS | 0.873 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.596 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:45,952 - INFO - 
combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:45,953 - INFO - combo.training.trainer - Epoch duration: 0:01:04.324762\n", + "2023-04-06 23:25:45,953 - INFO - combo.training.trainer - Estimated training time remaining: 6:55:52\n", + "2023-04-06 23:25:45,953 - INFO - allennlp.training.trainer - Epoch 32/399\n", + "2023-04-06 23:25:45,953 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:25:45,954 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:25:45,959 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9301, LAS: 0.8697, UEM: 0.4459, LEM: 0.2277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4560, partial_loss/deprel_loss: 0.6288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7054, loss: 0.8977, batch_reg_loss: 0.1112, reg_loss: 0.1112 ||: 4%|4 | 4/95 [00:02<01:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9292, LAS: 0.8692, UEM: 0.4227, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6525, partial_loss/deprel_loss: 0.7815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8671, loss: 0.8927, batch_reg_loss: 0.1113, reg_loss: 0.1112 ||: 8%|8 | 8/95 [00:05<00:56, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9238, LAS: 0.8639, UEM: 0.4082, LEM: 0.1875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.5976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6766, loss: 0.9322, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||: 13%|#2 | 12/95 [00:07<00:53, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9317, LAS: 0.8737, UEM: 0.5259, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3335, partial_loss/deprel_loss: 0.5011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.8531, batch_reg_loss: 0.1115, reg_loss: 0.1113 ||: 16%|#5 | 15/95 [00:09<00:52, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9319, LAS: 0.8730, UEM: 0.5110, LEM: 0.2590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7384, loss: 0.8532, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||: 20%|## | 19/95 [00:12<00:49, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9342, LAS: 0.8755, UEM: 0.5384, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1421, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4428, loss: 0.8315, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||: 24%|##4 | 23/95 [00:14<00:46, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9353, LAS: 0.8765, UEM: 0.5362, LEM: 0.2757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4069, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6745, loss: 0.8210, batch_reg_loss: 0.1117, reg_loss: 0.1114 ||: 27%|##7 | 26/95 [00:17<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7829, UAS: 0.9313, LAS: 0.8721, UEM: 0.5203, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9171, partial_loss/deprel_loss: 1.3065, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.5404, loss: 0.8508, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||: 31%|### | 29/95 [00:19<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9340, LAS: 0.8752, UEM: 0.5428, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3922, partial_loss/deprel_loss: 0.5541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.8246, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||: 34%|###3 | 32/95 [00:21<00:44, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8264, UAS: 0.9337, LAS: 0.8745, UEM: 0.5313, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2626, partial_loss/deprel_loss: 1.0762, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2253, loss: 0.8320, batch_reg_loss: 0.1119, reg_loss: 0.1115 ||: 38%|###7 | 36/95 [00:23<00:39, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9334, LAS: 0.8741, UEM: 0.5304, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.5026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5676, loss: 0.8348, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||: 41%|####1 | 39/95 [00:26<00:40, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9327, LAS: 0.8730, UEM: 0.5162, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7776, loss: 0.8433, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||: 44%|####4 | 42/95 [00:28<00:37, 1.41it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9329, LAS: 0.8732, UEM: 0.5139, LEM: 0.2592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3069, partial_loss/deprel_loss: 0.5136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5843, loss: 0.8430, batch_reg_loss: 0.1121, reg_loss: 0.1116 ||: 47%|####7 | 45/95 [00:30<00:35, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.9331, LAS: 0.8734, UEM: 0.5439, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1491, partial_loss/deprel_loss: 1.0949, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2179, loss: 0.8432, batch_reg_loss: 0.1121, reg_loss: 0.1117 ||: 51%|##### | 48/95 [00:32<00:34, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9332, LAS: 0.8734, UEM: 0.5434, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 0.4329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.8439, batch_reg_loss: 0.1122, reg_loss: 0.1117 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9338, LAS: 0.8742, UEM: 0.5455, LEM: 0.3016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0053, partial_loss/deprel_loss: 0.9650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0853, loss: 0.8405, batch_reg_loss: 0.1123, reg_loss: 0.1117 ||: 58%|#####7 | 55/95 [00:37<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9324, LAS: 0.8728, UEM: 0.5294, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8218, partial_loss/deprel_loss: 0.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0561, loss: 0.8512, batch_reg_loss: 0.1124, reg_loss: 0.1118 ||: 62%|######2 | 59/95 [00:39<00:24, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9331, LAS: 0.8736, UEM: 0.5349, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1961, partial_loss/deprel_loss: 0.4335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.8452, batch_reg_loss: 0.1125, reg_loss: 0.1118 ||: 65%|######5 | 62/95 [00:42<00:22, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9335, LAS: 0.8738, UEM: 0.5307, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.5466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6071, loss: 0.8436, batch_reg_loss: 0.1125, reg_loss: 0.1119 ||: 69%|######9 | 66/95 [00:44<00:19, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8010, UAS: 0.9334, LAS: 0.8740, UEM: 0.5416, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5383, partial_loss/deprel_loss: 1.2065, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3855, loss: 0.8403, batch_reg_loss: 0.1126, reg_loss: 0.1119 ||: 74%|#######3 | 70/95 [00:47<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9331, LAS: 0.8737, UEM: 0.5406, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7620, partial_loss/deprel_loss: 0.8850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.8439, batch_reg_loss: 0.1127, reg_loss: 0.1119 ||: 77%|#######6 | 73/95 [00:49<00:14, 1.47it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9328, LAS: 0.8733, UEM: 0.5343, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.6720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7566, loss: 0.8478, batch_reg_loss: 0.1127, reg_loss: 0.1120 ||: 80%|######## | 76/95 [00:51<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9316, LAS: 0.8721, UEM: 0.5348, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.4674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5322, loss: 0.8570, batch_reg_loss: 0.1128, reg_loss: 0.1120 ||: 83%|########3 | 79/95 [00:53<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9323, LAS: 0.8730, UEM: 0.5379, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4902, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7520, loss: 0.8507, batch_reg_loss: 0.1129, reg_loss: 0.1120 ||: 86%|########6 | 82/95 [00:56<00:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9326, LAS: 0.8733, UEM: 0.5386, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2232, partial_loss/deprel_loss: 0.4530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5200, loss: 0.8478, batch_reg_loss: 0.1129, reg_loss: 0.1121 ||: 89%|########9 | 85/95 [00:58<00:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9326, LAS: 0.8732, UEM: 0.5383, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6636, partial_loss/deprel_loss: 0.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8643, loss: 0.8471, batch_reg_loss: 0.1130, reg_loss: 0.1121 ||: 93%|#########2| 88/95 [01:00<00:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8125, UAS: 0.9313, LAS: 0.8716, UEM: 0.5328, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4500, partial_loss/deprel_loss: 1.1874, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3530, loss: 0.8586, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||: 96%|#########5| 91/95 [01:02<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9320, LAS: 0.8725, UEM: 0.5489, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8698, partial_loss/deprel_loss: 0.9173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0209, loss: 0.8512, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||: 99%|#########8| 94/95 [01:04<00:00, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9323, LAS: 0.8729, UEM: 0.5514, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2711, partial_loss/deprel_loss: 0.4642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.8479, batch_reg_loss: 0.1131, reg_loss: 0.1122 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - reg_loss | 0.112 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UEM | 0.551 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - LEM | 0.306 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - EM | 0.908 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.271 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.464 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - loss | 0.848 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - LAS | 0.873 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:51,302 - 
INFO - combo.training.trainer - Epoch duration: 0:01:05.348414\n", + "2023-04-06 23:26:51,302 - INFO - combo.training.trainer - Estimated training time remaining: 6:54:17\n", + "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - Epoch 33/399\n", + "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:26:51,308 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9486, LAS: 0.8924, UEM: 0.7037, LEM: 0.4360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.4336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.6325, batch_reg_loss: 0.1132, reg_loss: 0.1132 ||: 3%|3 | 3/95 [00:02<01:11, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9275, LAS: 0.8681, UEM: 0.5495, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8843, partial_loss/deprel_loss: 0.8701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9862, loss: 0.8366, batch_reg_loss: 0.1133, reg_loss: 0.1132 ||: 7%|7 | 7/95 [00:04<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7927, UAS: 0.9251, LAS: 0.8656, UEM: 0.5293, LEM: 0.2882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7105, partial_loss/deprel_loss: 1.2121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4251, loss: 0.8632, batch_reg_loss: 0.1133, reg_loss: 0.1132 ||: 11%|# | 10/95 [00:06<01:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9341, LAS: 0.8756, 
UEM: 0.6130, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1157, partial_loss/deprel_loss: 0.3530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4190, loss: 0.7885, batch_reg_loss: 0.1134, reg_loss: 0.1133 ||: 14%|#3 | 13/95 [00:09<01:01, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9371, LAS: 0.8785, UEM: 0.6068, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6198, partial_loss/deprel_loss: 0.7161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8103, loss: 0.7708, batch_reg_loss: 0.1135, reg_loss: 0.1133 ||: 17%|#6 | 16/95 [00:11<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9419, LAS: 0.8848, UEM: 0.6580, LEM: 0.3863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.4466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.7275, batch_reg_loss: 0.1135, reg_loss: 0.1133 ||: 20%|## | 19/95 [00:13<00:57, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9369, LAS: 0.8787, UEM: 0.6148, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9499, partial_loss/deprel_loss: 0.9590, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0708, loss: 0.7791, batch_reg_loss: 0.1136, reg_loss: 0.1134 ||: 24%|##4 | 23/95 [00:16<00:51, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9355, LAS: 0.8764, UEM: 0.5868, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.6071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6651, loss: 0.8012, batch_reg_loss: 0.1137, 
reg_loss: 0.1134 ||: 28%|##8 | 27/95 [00:18<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9343, LAS: 0.8750, UEM: 0.5813, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2071, partial_loss/deprel_loss: 1.0966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2324, loss: 0.8155, batch_reg_loss: 0.1137, reg_loss: 0.1134 ||: 32%|###1 | 30/95 [00:21<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9336, LAS: 0.8742, UEM: 0.5707, LEM: 0.3162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4102, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.8187, batch_reg_loss: 0.1138, reg_loss: 0.1135 ||: 35%|###4 | 33/95 [00:23<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9355, LAS: 0.8767, UEM: 0.5810, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3768, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.8022, batch_reg_loss: 0.1138, reg_loss: 0.1135 ||: 38%|###7 | 36/95 [00:25<00:43, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8634, UAS: 0.9352, LAS: 0.8765, UEM: 0.5675, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7297, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9423, loss: 0.8053, batch_reg_loss: 0.1139, reg_loss: 0.1135 ||: 41%|####1 | 39/95 [00:27<00:40, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9063, UAS: 0.9338, LAS: 0.8749, UEM: 0.5621, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2653, partial_loss/deprel_loss: 0.5660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.8215, batch_reg_loss: 0.1140, reg_loss: 0.1136 ||: 44%|####4 | 42/95 [00:29<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9320, LAS: 0.8728, UEM: 0.5448, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8942, partial_loss/deprel_loss: 0.9231, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0313, loss: 0.8381, batch_reg_loss: 0.1141, reg_loss: 0.1136 ||: 48%|####8 | 46/95 [00:31<00:32, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8354, UAS: 0.9327, LAS: 0.8732, UEM: 0.5526, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1232, partial_loss/deprel_loss: 1.0909, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2115, loss: 0.8358, batch_reg_loss: 0.1141, reg_loss: 0.1136 ||: 53%|#####2 | 50/95 [00:34<00:30, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9309, LAS: 0.8713, UEM: 0.5454, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1690, partial_loss/deprel_loss: 0.9704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1244, loss: 0.8545, batch_reg_loss: 0.1142, reg_loss: 0.1137 ||: 57%|#####6 | 54/95 [00:37<00:27, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9310, LAS: 0.8713, UEM: 0.5375, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4611, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.7114, loss: 0.8543, batch_reg_loss: 0.1143, reg_loss: 0.1137 ||: 61%|######1 | 58/95 [00:39<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9307, LAS: 0.8712, UEM: 0.5276, LEM: 0.2754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0411, partial_loss/deprel_loss: 0.9490, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0818, loss: 0.8585, batch_reg_loss: 0.1144, reg_loss: 0.1138 ||: 65%|######5 | 62/95 [00:42<00:21, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9291, LAS: 0.8694, UEM: 0.5234, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2625, partial_loss/deprel_loss: 1.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7944, loss: 0.8754, batch_reg_loss: 0.1145, reg_loss: 0.1138 ||: 69%|######9 | 66/95 [00:45<00:18, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9305, LAS: 0.8709, UEM: 0.5339, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3025, partial_loss/deprel_loss: 0.5761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.8629, batch_reg_loss: 0.1146, reg_loss: 0.1139 ||: 74%|#######3 | 70/95 [00:47<00:15, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9320, LAS: 0.8724, UEM: 0.5526, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2794, partial_loss/deprel_loss: 0.4444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5261, loss: 0.8488, batch_reg_loss: 0.1147, reg_loss: 0.1139 ||: 78%|#######7 | 74/95 [00:50<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, 
UAS: 0.9328, LAS: 0.8733, UEM: 0.5528, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4616, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6955, loss: 0.8418, batch_reg_loss: 0.1148, reg_loss: 0.1139 ||: 82%|########2 | 78/95 [00:52<00:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9323, LAS: 0.8727, UEM: 0.5434, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.6636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7486, loss: 0.8450, batch_reg_loss: 0.1148, reg_loss: 0.1140 ||: 86%|########6 | 82/95 [00:55<00:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9326, LAS: 0.8728, UEM: 0.5411, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7292, partial_loss/deprel_loss: 0.9182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9953, loss: 0.8444, batch_reg_loss: 0.1149, reg_loss: 0.1140 ||: 91%|######### | 86/95 [00:58<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7848, UAS: 0.9314, LAS: 0.8716, UEM: 0.5342, LEM: 0.2754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8967, partial_loss/deprel_loss: 1.2783, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5170, loss: 0.8545, batch_reg_loss: 0.1150, reg_loss: 0.1141 ||: 95%|#########4| 90/95 [01:01<00:03, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9317, LAS: 0.8721, UEM: 0.5383, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3309, partial_loss/deprel_loss: 0.5393, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6127, loss: 0.8494, batch_reg_loss: 0.1151, reg_loss: 0.1141 ||: 98%|#########7| 93/95 [01:03<00:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9323, LAS: 0.8730, UEM: 0.5542, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0884, partial_loss/deprel_loss: 0.2159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3055, loss: 0.8428, batch_reg_loss: 0.1151, reg_loss: 0.1141 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - reg_loss | 0.114 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - UEM | 0.554 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - LEM | 0.301 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EM | 0.947 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.088 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.216 | N/A\n", + "2023-04-06 
23:27:56,391 - INFO - combo.training.tensorboard_writer - loss | 0.843 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - LAS | 0.873 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:56,392 - INFO - combo.training.trainer - Epoch duration: 0:01:05.090000\n", + "2023-04-06 23:27:56,392 - INFO - combo.training.trainer - Estimated training time remaining: 6:52:40\n", + "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - Epoch 34/399\n", + "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:27:56,399 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9454, LAS: 0.8897, UEM: 0.5625, LEM: 0.2768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5273, loss: 0.6903, batch_reg_loss: 0.1152, reg_loss: 0.1151 ||: 3%|3 | 3/95 [00:02<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9508, LAS: 0.8929, UEM: 0.5816, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3096, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6136, loss: 0.6771, batch_reg_loss: 0.1152, reg_loss: 0.1152 ||: 6%|6 | 6/95 [00:04<01:07, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8149, UAS: 0.9394, LAS: 0.8797, UEM: 0.5386, LEM: 0.2403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4532, partial_loss/deprel_loss: 1.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2743, loss: 0.7823, batch_reg_loss: 0.1153, reg_loss: 0.1152 ||: 9%|9 | 9/95 [00:06<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9356, LAS: 0.8751, UEM: 0.5214, LEM: 0.2343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.5428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5978, loss: 0.8289, batch_reg_loss: 0.1153, reg_loss: 0.1152 ||: 13%|#2 | 12/95 [00:08<00:59, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9389, LAS: 0.8795, UEM: 0.5678, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2516, partial_loss/deprel_loss: 0.4979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5640, loss: 0.7939, batch_reg_loss: 0.1154, reg_loss: 0.1153 ||: 16%|#5 | 15/95 [00:10<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9348, LAS: 0.8752, UEM: 0.5681, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3626, partial_loss/deprel_loss: 0.5587, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6350, loss: 0.8295, batch_reg_loss: 0.1155, reg_loss: 0.1153 ||: 20%|## | 19/95 [00:13<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9346, LAS: 0.8753, UEM: 0.5636, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.4340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.8377, batch_reg_loss: 0.1156, reg_loss: 0.1153 ||: 24%|##4 | 23/95 [00:16<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9337, LAS: 0.8742, UEM: 0.5384, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9168, partial_loss/deprel_loss: 0.8650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9910, loss: 0.8480, batch_reg_loss: 0.1156, reg_loss: 0.1154 ||: 28%|##8 | 27/95 [00:18<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9311, LAS: 0.8712, UEM: 0.5121, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0191, partial_loss/deprel_loss: 1.0519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1611, loss: 0.8715, batch_reg_loss: 0.1157, reg_loss: 0.1154 ||: 33%|###2 | 31/95 [00:21<00:41, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9323, LAS: 0.8731, UEM: 0.5610, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0757, partial_loss/deprel_loss: 0.1835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2778, loss: 0.8571, batch_reg_loss: 0.1158, reg_loss: 0.1155 ||: 37%|###6 | 35/95 [00:24<00:43, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9323, LAS: 0.8734, UEM: 0.5630, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7922, partial_loss/deprel_loss: 0.7743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8938, loss: 0.8563, batch_reg_loss: 0.1159, reg_loss: 0.1155 ||: 40%|#### | 38/95 [00:27<00:42, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9324, LAS: 0.8735, UEM: 0.5549, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6392, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8349, loss: 0.8536, batch_reg_loss: 0.1160, reg_loss: 0.1155 ||: 43%|####3 | 41/95 [00:29<00:39, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9329, LAS: 0.8741, UEM: 0.5491, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6518, loss: 0.8504, batch_reg_loss: 0.1160, reg_loss: 0.1156 ||: 46%|####6 | 44/95 [00:31<00:36, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9322, LAS: 0.8733, UEM: 0.5394, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6864, partial_loss/deprel_loss: 0.8533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9360, loss: 0.8589, batch_reg_loss: 0.1161, reg_loss: 0.1156 ||: 49%|####9 | 47/95 [00:33<00:34, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9318, LAS: 0.8731, UEM: 0.5378, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3048, partial_loss/deprel_loss: 0.4642, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.5485, loss: 0.8600, batch_reg_loss: 0.1162, reg_loss: 0.1156 ||: 53%|#####2 | 50/95 [00:35<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9308, LAS: 0.8725, UEM: 0.5379, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5077, loss: 0.8667, batch_reg_loss: 0.1162, reg_loss: 0.1157 ||: 56%|#####5 | 53/95 [00:37<00:30, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9318, LAS: 0.8736, UEM: 0.5398, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4101, partial_loss/deprel_loss: 0.5982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6769, loss: 0.8583, batch_reg_loss: 0.1163, reg_loss: 0.1157 ||: 59%|#####8 | 56/95 [00:40<00:28, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9318, LAS: 0.8738, UEM: 0.5579, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.4280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.8554, batch_reg_loss: 0.1163, reg_loss: 0.1157 ||: 62%|######2 | 59/95 [00:42<00:26, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9326, LAS: 0.8744, UEM: 0.5555, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5130, partial_loss/deprel_loss: 0.6787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7620, loss: 0.8500, batch_reg_loss: 0.1164, reg_loss: 0.1158 ||: 66%|######6 | 63/95 [00:44<00:22, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9323, LAS: 0.8740, UEM: 0.5542, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.4911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5659, loss: 0.8528, batch_reg_loss: 0.1165, reg_loss: 0.1158 ||: 69%|######9 | 66/95 [00:46<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9335, LAS: 0.8752, UEM: 0.5605, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4231, partial_loss/deprel_loss: 0.6362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.8413, batch_reg_loss: 0.1166, reg_loss: 0.1158 ||: 74%|#######3 | 70/95 [00:49<00:17, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9339, LAS: 0.8756, UEM: 0.5551, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.5605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6454, loss: 0.8376, batch_reg_loss: 0.1167, reg_loss: 0.1159 ||: 78%|#######7 | 74/95 [00:52<00:14, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9341, LAS: 0.8758, UEM: 0.5480, LEM: 0.2983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6369, partial_loss/deprel_loss: 0.7233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8228, loss: 0.8353, batch_reg_loss: 0.1167, reg_loss: 0.1159 ||: 82%|########2 | 78/95 [00:54<00:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9335, LAS: 0.8753, UEM: 0.5534, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.1816, partial_loss/deprel_loss: 0.3116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4024, loss: 0.8385, batch_reg_loss: 0.1168, reg_loss: 0.1160 ||: 86%|########6 | 82/95 [00:57<00:08, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9338, LAS: 0.8754, UEM: 0.5523, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3737, partial_loss/deprel_loss: 0.6308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6962, loss: 0.8371, batch_reg_loss: 0.1169, reg_loss: 0.1160 ||: 91%|######### | 86/95 [00:59<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7668, UAS: 0.9333, LAS: 0.8749, UEM: 0.5530, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1193, partial_loss/deprel_loss: 1.3323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6066, loss: 0.8406, batch_reg_loss: 0.1170, reg_loss: 0.1160 ||: 95%|#########4| 90/95 [01:02<00:03, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9335, LAS: 0.8749, UEM: 0.5575, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1158, partial_loss/deprel_loss: 0.3491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.8389, batch_reg_loss: 0.1171, reg_loss: 0.1161 ||: 99%|#########8| 94/95 [01:05<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9332, LAS: 0.8745, UEM: 0.5553, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0379, partial_loss/deprel_loss: 0.9985, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1235, loss: 0.8419, batch_reg_loss: 0.1171, reg_loss: 0.1161 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-06 
23:29:02,672 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - reg_loss | 0.116 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UEM | 0.555 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - LEM | 0.307 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EM | 0.837 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.038 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UAS | 0.933 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.999 | N/A\n", + "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - loss | 0.842 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - LAS | 0.874 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + 
"2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:02,675 - INFO - combo.training.trainer - Epoch duration: 0:01:06.282521\n", + "2023-04-06 23:29:02,675 - INFO - combo.training.trainer - Estimated training time remaining: 6:51:18\n", + "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - Epoch 35/399\n", + "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:29:02,682 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9328, LAS: 0.8700, UEM: 0.4015, LEM: 0.1409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 1.0499, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.8917, batch_reg_loss: 0.1172, reg_loss: 0.1171 ||: 4%|4 | 4/95 [00:02<00:56, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9388, LAS: 0.8803, UEM: 0.5021, LEM: 0.2380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6407, partial_loss/deprel_loss: 0.8017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8867, loss: 0.8298, batch_reg_loss: 0.1172, reg_loss: 0.1172 ||: 8%|8 | 8/95 [00:04<00:54, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9330, LAS: 0.8742, UEM: 0.4814, LEM: 0.2262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7000, 
partial_loss/deprel_loss: 0.7975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8953, loss: 0.8565, batch_reg_loss: 0.1173, reg_loss: 0.1172 ||: 13%|#2 | 12/95 [00:08<00:59, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9296, LAS: 0.8717, UEM: 0.4975, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2341, partial_loss/deprel_loss: 0.4173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4980, loss: 0.8744, batch_reg_loss: 0.1174, reg_loss: 0.1172 ||: 16%|#5 | 15/95 [00:10<00:57, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9355, LAS: 0.8785, UEM: 0.5918, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1491, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.8180, batch_reg_loss: 0.1175, reg_loss: 0.1173 ||: 19%|#8 | 18/95 [00:13<00:57, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8332, UAS: 0.9327, LAS: 0.8755, UEM: 0.5839, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1837, partial_loss/deprel_loss: 1.0341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1816, loss: 0.8458, batch_reg_loss: 0.1175, reg_loss: 0.1173 ||: 22%|##2 | 21/95 [00:15<00:53, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9330, LAS: 0.8747, UEM: 0.5557, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5207, partial_loss/deprel_loss: 0.6897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7735, loss: 0.8494, batch_reg_loss: 0.1176, reg_loss: 0.1174 ||: 26%|##6 | 25/95 [00:17<00:47, 
1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8585, UAS: 0.9341, LAS: 0.8764, UEM: 0.5420, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8242, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9622, loss: 0.8364, batch_reg_loss: 0.1177, reg_loss: 0.1174 ||: 31%|### | 29/95 [00:20<00:43, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9352, LAS: 0.8772, UEM: 0.5393, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3497, partial_loss/deprel_loss: 0.5675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6417, loss: 0.8275, batch_reg_loss: 0.1177, reg_loss: 0.1174 ||: 34%|###3 | 32/95 [00:22<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9349, LAS: 0.8771, UEM: 0.5751, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9193, partial_loss/deprel_loss: 0.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0808, loss: 0.8269, batch_reg_loss: 0.1178, reg_loss: 0.1175 ||: 37%|###6 | 35/95 [00:24<00:44, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9314, LAS: 0.8731, UEM: 0.5634, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.6489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.8570, batch_reg_loss: 0.1179, reg_loss: 0.1175 ||: 40%|#### | 38/95 [00:27<00:40, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9312, LAS: 0.8725, UEM: 0.5498, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4005, partial_loss/deprel_loss: 0.5868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6675, loss: 0.8583, batch_reg_loss: 0.1179, reg_loss: 0.1175 ||: 44%|####4 | 42/95 [00:29<00:36, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9329, LAS: 0.8745, UEM: 0.5573, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4212, partial_loss/deprel_loss: 0.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6932, loss: 0.8438, batch_reg_loss: 0.1180, reg_loss: 0.1176 ||: 47%|####7 | 45/95 [00:31<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9329, LAS: 0.8745, UEM: 0.5568, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2502, partial_loss/deprel_loss: 0.4501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.8414, batch_reg_loss: 0.1181, reg_loss: 0.1176 ||: 52%|#####1 | 49/95 [00:34<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8264, UAS: 0.9305, LAS: 0.8721, UEM: 0.5382, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3343, partial_loss/deprel_loss: 1.0364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2141, loss: 0.8611, batch_reg_loss: 0.1182, reg_loss: 0.1176 ||: 56%|#####5 | 53/95 [00:36<00:27, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9303, LAS: 0.8717, UEM: 0.5311, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8531, partial_loss/deprel_loss: 0.8836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9957, loss: 0.8645, batch_reg_loss: 0.1183, reg_loss: 0.1177 ||: 60%|###### | 57/95 [00:38<00:24, 1.56it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9305, LAS: 0.8718, UEM: 0.5282, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6278, loss: 0.8638, batch_reg_loss: 0.1183, reg_loss: 0.1177 ||: 64%|######4 | 61/95 [00:41<00:22, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9321, LAS: 0.8736, UEM: 0.5395, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.5256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5979, loss: 0.8497, batch_reg_loss: 0.1184, reg_loss: 0.1178 ||: 68%|######8 | 65/95 [00:44<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9329, LAS: 0.8746, UEM: 0.5445, LEM: 0.2967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6270, loss: 0.8416, batch_reg_loss: 0.1185, reg_loss: 0.1178 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9326, LAS: 0.8743, UEM: 0.5391, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6426, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8412, loss: 0.8432, batch_reg_loss: 0.1186, reg_loss: 0.1178 ||: 76%|#######5 | 72/95 [00:49<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9332, LAS: 0.8750, UEM: 0.5475, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.8362, batch_reg_loss: 0.1186, reg_loss: 0.1179 ||: 79%|#######8 | 75/95 [00:52<00:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9341, LAS: 0.8760, UEM: 0.5571, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1853, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5045, loss: 0.8281, batch_reg_loss: 0.1187, reg_loss: 0.1179 ||: 82%|########2 | 78/95 [00:54<00:12, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9347, LAS: 0.8766, UEM: 0.5570, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2554, partial_loss/deprel_loss: 0.4840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.8217, batch_reg_loss: 0.1188, reg_loss: 0.1179 ||: 85%|########5 | 81/95 [00:56<00:10, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9342, LAS: 0.8760, UEM: 0.5472, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8270, partial_loss/deprel_loss: 0.9002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0044, loss: 0.8251, batch_reg_loss: 0.1188, reg_loss: 0.1180 ||: 89%|########9 | 85/95 [00:59<00:07, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9342, LAS: 0.8761, UEM: 0.5568, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6723, partial_loss/deprel_loss: 1.2662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4663, loss: 0.8257, batch_reg_loss: 
0.1189, reg_loss: 0.1180 ||: 93%|#########2| 88/95 [01:01<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9342, LAS: 0.8763, UEM: 0.5618, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3461, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.8216, batch_reg_loss: 0.1189, reg_loss: 0.1180 ||: 96%|#########5| 91/95 [01:03<00:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9329, LAS: 0.8749, UEM: 0.5539, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6375, partial_loss/deprel_loss: 0.6770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8337, batch_reg_loss: 0.1190, reg_loss: 0.1181 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9329, LAS: 0.8749, UEM: 0.5539, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6375, partial_loss/deprel_loss: 0.6770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8337, batch_reg_loss: 0.1190, reg_loss: 0.1181 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 23:30:08,851 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9588, LAS: 0.9043, UEM: 0.7300, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2290, partial_loss/deprel_loss: 22.2542, partial_loss/cycle_loss: 0.0000, batch_loss: 17.8492, loss: 24.0080, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:03<00:08, 1.06s/it]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9461, LAS: 0.8875, UEM: 0.6354, LEM: 0.3292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3987, partial_loss/deprel_loss: 56.9363, partial_loss/cycle_loss: 0.0000, batch_loss: 45.8288, loss: 27.9184, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:06<00:05, 1.07s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9473, LAS: 0.8914, UEM: 0.6242, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3161, partial_loss/deprel_loss: 27.6688, partial_loss/cycle_loss: 0.0000, batch_loss: 22.1982, loss: 25.7038, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:09<00:02, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9482, LAS: 0.8943, UEM: 0.6692, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0665, partial_loss/deprel_loss: 47.8072, partial_loss/cycle_loss: 0.0000, batch_loss: 38.4590, loss: 25.9505, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00, 1.01s/it]\n", + "2023-04-06 23:30:19,988 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - reg_loss | 0.118 | 0.000\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UEM | 0.554 | 0.669\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - LEM | 0.307 | 
0.395\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EM | 0.880 | 0.878\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.637 | 1.067\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UAS | 0.933 | 0.948\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.677 | 47.807\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - loss | 0.834 | 25.951\n", + "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | 0.894\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:19,991 - INFO - combo.training.trainer - Epoch duration: 0:01:17.315801\n", + "2023-04-06 23:30:19,991 - INFO - combo.training.trainer - Estimated training time remaining: 6:51:49\n", + "2023-04-06 23:30:19,991 - INFO - allennlp.training.trainer - Epoch 36/399\n", + "2023-04-06 23:30:19,991 - INFO - 
allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:30:19,991 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:30:19,998 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9477, LAS: 0.8948, UEM: 0.7414, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.3357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4228, loss: 0.6724, batch_reg_loss: 0.1191, reg_loss: 0.1190 ||: 3%|3 | 3/95 [00:02<01:18, 1.17it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9447, LAS: 0.8907, UEM: 0.7507, LEM: 0.5066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1926, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4823, loss: 0.7071, batch_reg_loss: 0.1191, reg_loss: 0.1191 ||: 6%|6 | 6/95 [00:04<01:14, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9437, LAS: 0.8877, UEM: 0.6831, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8091, partial_loss/deprel_loss: 0.8481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9595, loss: 0.7308, batch_reg_loss: 0.1192, reg_loss: 0.1191 ||: 9%|9 | 9/95 [00:07<01:08, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9433, LAS: 0.8878, UEM: 0.6720, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7337, 
batch_reg_loss: 0.1193, reg_loss: 0.1191 ||: 14%|#3 | 13/95 [00:09<01:01, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9337, LAS: 0.8770, UEM: 0.6113, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9070, partial_loss/deprel_loss: 0.9308, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0454, loss: 0.8210, batch_reg_loss: 0.1194, reg_loss: 0.1192 ||: 18%|#7 | 17/95 [00:12<00:55, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9360, LAS: 0.8786, UEM: 0.6085, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6687, partial_loss/deprel_loss: 0.8803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9574, loss: 0.8055, batch_reg_loss: 0.1194, reg_loss: 0.1192 ||: 22%|##2 | 21/95 [00:14<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9339, LAS: 0.8761, UEM: 0.5774, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4460, partial_loss/deprel_loss: 0.5838, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6758, loss: 0.8180, batch_reg_loss: 0.1195, reg_loss: 0.1193 ||: 26%|##6 | 25/95 [00:16<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9365, LAS: 0.8790, UEM: 0.5851, LEM: 0.3262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3892, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6353, loss: 0.7989, batch_reg_loss: 0.1196, reg_loss: 0.1193 ||: 31%|### | 29/95 [00:19<00:41, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9373, LAS: 0.8797, UEM: 0.5731, LEM: 
0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4843, partial_loss/deprel_loss: 0.6256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7170, loss: 0.7960, batch_reg_loss: 0.1197, reg_loss: 0.1194 ||: 35%|###4 | 33/95 [00:21<00:37, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9384, LAS: 0.8806, UEM: 0.5733, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1741, partial_loss/deprel_loss: 0.3951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4707, loss: 0.7905, batch_reg_loss: 0.1198, reg_loss: 0.1194 ||: 39%|###8 | 37/95 [00:24<00:36, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9369, LAS: 0.8790, UEM: 0.5588, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5788, partial_loss/deprel_loss: 0.6406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7481, loss: 0.8037, batch_reg_loss: 0.1199, reg_loss: 0.1194 ||: 43%|####3 | 41/95 [00:26<00:33, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9392, LAS: 0.8820, UEM: 0.5883, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5245, loss: 0.7805, batch_reg_loss: 0.1199, reg_loss: 0.1195 ||: 47%|####7 | 45/95 [00:29<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.9385, LAS: 0.8812, UEM: 0.5812, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0758, partial_loss/deprel_loss: 1.0011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.7848, batch_reg_loss: 0.1200, reg_loss: 0.1195 
||: 52%|#####1 | 49/95 [00:32<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9356, LAS: 0.8781, UEM: 0.5654, LEM: 0.3101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.6590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 0.8110, batch_reg_loss: 0.1201, reg_loss: 0.1196 ||: 56%|#####5 | 53/95 [00:34<00:26, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8106, UAS: 0.9349, LAS: 0.8773, UEM: 0.5602, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5064, partial_loss/deprel_loss: 1.1534, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3441, loss: 0.8169, batch_reg_loss: 0.1202, reg_loss: 0.1196 ||: 60%|###### | 57/95 [00:37<00:24, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9353, LAS: 0.8777, UEM: 0.5632, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0102, partial_loss/deprel_loss: 1.0672, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1761, loss: 0.8153, batch_reg_loss: 0.1202, reg_loss: 0.1196 ||: 64%|######4 | 61/95 [00:39<00:21, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9368, LAS: 0.8799, UEM: 0.5933, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.5073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6032, loss: 0.7989, batch_reg_loss: 0.1203, reg_loss: 0.1197 ||: 68%|######8 | 65/95 [00:43<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9374, LAS: 0.8805, UEM: 0.5959, LEM: 0.3443, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2705, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5253, loss: 0.7937, batch_reg_loss: 0.1204, reg_loss: 0.1197 ||: 72%|#######1 | 68/95 [00:45<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9362, LAS: 0.8789, UEM: 0.5825, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7992, partial_loss/deprel_loss: 0.8101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9284, loss: 0.8062, batch_reg_loss: 0.1205, reg_loss: 0.1198 ||: 76%|#######5 | 72/95 [00:47<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9347, LAS: 0.8771, UEM: 0.5741, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4389, partial_loss/deprel_loss: 0.6778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7506, loss: 0.8209, batch_reg_loss: 0.1206, reg_loss: 0.1198 ||: 80%|######## | 76/95 [00:50<00:12, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9343, LAS: 0.8766, UEM: 0.5661, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5118, partial_loss/deprel_loss: 0.6204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7193, loss: 0.8243, batch_reg_loss: 0.1206, reg_loss: 0.1198 ||: 84%|########4 | 80/95 [00:52<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9334, LAS: 0.8756, UEM: 0.5653, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4969, partial_loss/deprel_loss: 0.6062, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7051, loss: 0.8302, batch_reg_loss: 0.1207, reg_loss: 0.1199 ||: 88%|########8 | 84/95 [00:55<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9330, LAS: 0.8751, UEM: 0.5612, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5179, partial_loss/deprel_loss: 0.6615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.8346, batch_reg_loss: 0.1208, reg_loss: 0.1199 ||: 92%|#########1| 87/95 [00:57<00:05, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9330, LAS: 0.8751, UEM: 0.5596, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.8357, batch_reg_loss: 0.1209, reg_loss: 0.1199 ||: 95%|#########4| 90/95 [00:59<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8294, UAS: 0.9328, LAS: 0.8748, UEM: 0.5558, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1469, partial_loss/deprel_loss: 1.0104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1587, loss: 0.8370, batch_reg_loss: 0.1210, reg_loss: 0.1200 ||: 99%|#########8| 94/95 [01:02<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9329, LAS: 0.8749, UEM: 0.5544, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5993, partial_loss/deprel_loss: 0.7079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.8367, batch_reg_loss: 0.1210, reg_loss: 0.1200 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-06 23:31:22,906 - INFO - combo.training.tensorboard_writer - Training | 
Validation\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - reg_loss | 0.120 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UEM | 0.554 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - LEM | 0.310 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EM | 0.884 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.599 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UAS | 0.933 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.708 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - loss | 0.837 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - 
ELEM | 0.000 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:22,908 - INFO - combo.training.trainer - Epoch duration: 0:01:02.917721\n", + "2023-04-06 23:31:22,909 - INFO - combo.training.trainer - Estimated training time remaining: 6:49:52\n", + "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - Epoch 37/399\n", + "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:31:22,916 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9514, LAS: 0.8954, UEM: 0.5949, LEM: 0.2786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6434, partial_loss/deprel_loss: 0.7854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8781, loss: 0.6990, batch_reg_loss: 0.1211, reg_loss: 0.1210 ||: 4%|4 | 4/95 [00:02<00:54, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9370, LAS: 0.8811, UEM: 0.5511, LEM: 0.2706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4832, partial_loss/deprel_loss: 0.6702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8023, batch_reg_loss: 0.1211, reg_loss: 0.1211 ||: 8%|8 | 8/95 [00:04<00:52, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9313, LAS: 0.8750, UEM: 0.4997, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6666, partial_loss/deprel_loss: 0.7253, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.8347, loss: 0.8502, batch_reg_loss: 0.1212, reg_loss: 0.1211 ||: 12%|#1 | 11/95 [00:06<00:53, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9320, LAS: 0.8754, UEM: 0.4993, LEM: 0.2396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7533, partial_loss/deprel_loss: 0.7773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8938, loss: 0.8417, batch_reg_loss: 0.1213, reg_loss: 0.1211 ||: 15%|#4 | 14/95 [00:09<00:54, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9336, LAS: 0.8763, UEM: 0.4745, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4635, partial_loss/deprel_loss: 0.5870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.8257, batch_reg_loss: 0.1214, reg_loss: 0.1212 ||: 19%|#8 | 18/95 [00:11<00:50, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9368, LAS: 0.8794, UEM: 0.5117, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5865, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8615, loss: 0.8011, batch_reg_loss: 0.1215, reg_loss: 0.1212 ||: 23%|##3 | 22/95 [00:14<00:47, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9362, LAS: 0.8787, UEM: 0.4922, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8021, partial_loss/deprel_loss: 0.8052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9261, loss: 0.8076, batch_reg_loss: 0.1215, reg_loss: 0.1213 ||: 27%|##7 | 26/95 [00:16<00:43, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9360, LAS: 0.8787, UEM: 0.4889, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.5390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6129, loss: 0.8082, batch_reg_loss: 0.1216, reg_loss: 0.1213 ||: 32%|###1 | 30/95 [00:19<00:43, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9366, LAS: 0.8795, UEM: 0.5116, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1484, partial_loss/deprel_loss: 0.3678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.8037, batch_reg_loss: 0.1217, reg_loss: 0.1213 ||: 35%|###4 | 33/95 [00:21<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9365, LAS: 0.8796, UEM: 0.5081, LEM: 0.2506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1201, partial_loss/deprel_loss: 0.9817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1311, loss: 0.8029, batch_reg_loss: 0.1217, reg_loss: 0.1214 ||: 38%|###7 | 36/95 [00:24<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9357, LAS: 0.8786, UEM: 0.5266, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.8096, batch_reg_loss: 0.1218, reg_loss: 0.1214 ||: 41%|####1 | 39/95 [00:26<00:40, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8265, UAS: 0.9358, LAS: 0.8790, UEM: 0.5437, LEM: 0.2860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2482, partial_loss/deprel_loss: 1.0411, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.2044, loss: 0.8043, batch_reg_loss: 0.1218, reg_loss: 0.1214 ||: 44%|####4 | 42/95 [00:29<00:40, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7986, UAS: 0.9314, LAS: 0.8745, UEM: 0.5338, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8628, partial_loss/deprel_loss: 1.1907, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4471, loss: 0.8394, batch_reg_loss: 0.1219, reg_loss: 0.1215 ||: 48%|####8 | 46/95 [00:31<00:36, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9324, LAS: 0.8757, UEM: 0.5487, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1373, partial_loss/deprel_loss: 0.2893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3809, loss: 0.8302, batch_reg_loss: 0.1220, reg_loss: 0.1215 ||: 52%|#####1 | 49/95 [00:33<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9332, LAS: 0.8763, UEM: 0.5467, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2825, partial_loss/deprel_loss: 0.4777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.8246, batch_reg_loss: 0.1221, reg_loss: 0.1215 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9329, LAS: 0.8760, UEM: 0.5492, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2645, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5817, loss: 0.8270, batch_reg_loss: 0.1221, reg_loss: 0.1216 ||: 58%|#####7 | 55/95 [00:38<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8588, UAS: 0.9322, LAS: 0.8753, UEM: 0.5408, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8819, partial_loss/deprel_loss: 0.8136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9494, loss: 0.8340, batch_reg_loss: 0.1222, reg_loss: 0.1216 ||: 61%|######1 | 58/95 [00:40<00:26, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8506, UAS: 0.9315, LAS: 0.8742, UEM: 0.5311, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0343, partial_loss/deprel_loss: 0.8963, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0462, loss: 0.8424, batch_reg_loss: 0.1222, reg_loss: 0.1216 ||: 64%|######4 | 61/95 [00:42<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9313, LAS: 0.8739, UEM: 0.5281, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3109, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.8451, batch_reg_loss: 0.1223, reg_loss: 0.1217 ||: 68%|######8 | 65/95 [00:44<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9308, LAS: 0.8734, UEM: 0.5217, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7375, loss: 0.8507, batch_reg_loss: 0.1224, reg_loss: 0.1217 ||: 73%|#######2 | 69/95 [00:47<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9316, LAS: 0.8742, UEM: 0.5276, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5359, partial_loss/deprel_loss: 0.6530, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7521, loss: 0.8441, batch_reg_loss: 0.1225, reg_loss: 0.1218 ||: 77%|#######6 | 73/95 [00:50<00:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9317, LAS: 0.8741, UEM: 0.5278, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1349, partial_loss/deprel_loss: 1.0402, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1817, loss: 0.8445, batch_reg_loss: 0.1226, reg_loss: 0.1218 ||: 80%|######## | 76/95 [00:52<00:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9314, LAS: 0.8737, UEM: 0.5233, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0308, partial_loss/deprel_loss: 0.8860, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0376, loss: 0.8476, batch_reg_loss: 0.1226, reg_loss: 0.1218 ||: 83%|########3 | 79/95 [00:55<00:11, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9320, LAS: 0.8747, UEM: 0.5446, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.4654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5486, loss: 0.8411, batch_reg_loss: 0.1227, reg_loss: 0.1218 ||: 86%|########6 | 82/95 [00:57<00:10, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9321, LAS: 0.8748, UEM: 0.5496, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9542, partial_loss/deprel_loss: 1.0536, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1565, loss: 0.8409, batch_reg_loss: 0.1228, reg_loss: 0.1219 ||: 89%|########9 | 85/95 [01:00<00:07, 1.29it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", 
+ "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9322, LAS: 0.8749, UEM: 0.5446, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7975, partial_loss/deprel_loss: 0.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.8398, batch_reg_loss: 0.1228, reg_loss: 0.1219 ||: 94%|#########3| 89/95 [01:02<00:04, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9325, LAS: 0.8750, UEM: 0.5452, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5842, partial_loss/deprel_loss: 0.7836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8666, loss: 0.8388, batch_reg_loss: 0.1229, reg_loss: 0.1219 ||: 97%|#########6| 92/95 [01:04<00:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9333, LAS: 0.8758, UEM: 0.5520, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6730, partial_loss/deprel_loss: 0.7886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8884, loss: 0.8336, batch_reg_loss: 0.1230, reg_loss: 0.1220 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-06 23:32:29,689 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - reg_loss | 0.122 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UEM | 0.552 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - 
LEM | 0.306 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EM | 0.875 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.673 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UAS | 0.933 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.789 | N/A\n", + "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - loss | 0.834 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - LAS | 0.876 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:32:29,692 - INFO - combo.training.trainer - Epoch duration: 0:01:06.782898\n", + "2023-04-06 23:32:29,692 - INFO - combo.training.trainer - Estimated training time remaining: 6:48:35\n", + "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - Epoch 38/399\n", + "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - 
Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:32:29,699 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9468, LAS: 0.8878, UEM: 0.5179, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3875, partial_loss/deprel_loss: 0.5396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.7048, batch_reg_loss: 0.1230, reg_loss: 0.1230 ||: 3%|3 | 3/95 [00:02<01:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9404, LAS: 0.8853, UEM: 0.5849, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2919, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5523, loss: 0.7458, batch_reg_loss: 0.1231, reg_loss: 0.1230 ||: 6%|6 | 6/95 [00:04<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9322, LAS: 0.8764, UEM: 0.5648, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8550, partial_loss/deprel_loss: 0.9004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0144, loss: 0.8174, batch_reg_loss: 0.1231, reg_loss: 0.1231 ||: 11%|# | 10/95 [00:06<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8336, UAS: 0.9306, LAS: 0.8744, UEM: 0.5312, LEM: 0.2768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0999, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1245, loss: 0.8379, batch_reg_loss: 0.1232, reg_loss: 0.1231 ||: 15%|#4 | 14/95 [00:09<00:54, 1.48it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9303, LAS: 0.8744, UEM: 0.5064, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5468, partial_loss/deprel_loss: 0.6683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7673, loss: 0.8399, batch_reg_loss: 0.1233, reg_loss: 0.1231 ||: 19%|#8 | 18/95 [00:11<00:51, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9305, LAS: 0.8738, UEM: 0.5088, LEM: 0.2519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2656, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5625, loss: 0.8459, batch_reg_loss: 0.1234, reg_loss: 0.1232 ||: 22%|##2 | 21/95 [00:14<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9296, LAS: 0.8724, UEM: 0.4969, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5105, partial_loss/deprel_loss: 1.2375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4156, loss: 0.8596, batch_reg_loss: 0.1234, reg_loss: 0.1232 ||: 26%|##6 | 25/95 [00:16<00:46, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9308, LAS: 0.8741, UEM: 0.5015, LEM: 0.2442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4046, partial_loss/deprel_loss: 0.6064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6896, loss: 0.8492, batch_reg_loss: 0.1235, reg_loss: 0.1232 ||: 29%|##9 | 28/95 [00:18<00:45, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9338, LAS: 0.8778, UEM: 0.5633, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5251, 
partial_loss/deprel_loss: 0.6847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7764, loss: 0.8249, batch_reg_loss: 0.1236, reg_loss: 0.1233 ||: 33%|###2 | 31/95 [00:21<00:45, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9338, LAS: 0.8776, UEM: 0.5580, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9901, partial_loss/deprel_loss: 0.9016, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0430, loss: 0.8267, batch_reg_loss: 0.1236, reg_loss: 0.1233 ||: 36%|###5 | 34/95 [00:23<00:42, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9350, LAS: 0.8789, UEM: 0.5612, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.5764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6822, loss: 0.8136, batch_reg_loss: 0.1237, reg_loss: 0.1233 ||: 39%|###8 | 37/95 [00:25<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9359, LAS: 0.8801, UEM: 0.5639, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.6427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7435, loss: 0.8035, batch_reg_loss: 0.1237, reg_loss: 0.1234 ||: 42%|####2 | 40/95 [00:27<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9368, LAS: 0.8812, UEM: 0.5744, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1437, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4183, loss: 0.7933, batch_reg_loss: 0.1238, reg_loss: 0.1234 ||: 45%|####5 | 43/95 
[00:29<00:37, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9356, LAS: 0.8795, UEM: 0.5579, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.6600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.8057, batch_reg_loss: 0.1239, reg_loss: 0.1234 ||: 49%|####9 | 47/95 [00:32<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8432, UAS: 0.9358, LAS: 0.8798, UEM: 0.5603, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9331, partial_loss/deprel_loss: 0.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9967, loss: 0.8002, batch_reg_loss: 0.1239, reg_loss: 0.1235 ||: 53%|#####2 | 50/95 [00:34<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8193, UAS: 0.9354, LAS: 0.8789, UEM: 0.5552, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3234, partial_loss/deprel_loss: 1.0071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1944, loss: 0.8053, batch_reg_loss: 0.1240, reg_loss: 0.1235 ||: 57%|#####6 | 54/95 [00:36<00:27, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9363, LAS: 0.8802, UEM: 0.5559, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2073, partial_loss/deprel_loss: 0.5454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.7968, batch_reg_loss: 0.1241, reg_loss: 0.1235 ||: 61%|######1 | 58/95 [00:39<00:23, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9352, LAS: 0.8788, UEM: 0.5565, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5459, partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8291, loss: 0.8069, batch_reg_loss: 0.1241, reg_loss: 0.1236 ||: 65%|######5 | 62/95 [00:41<00:21, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9360, LAS: 0.8799, UEM: 0.5602, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.5754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6562, loss: 0.7988, batch_reg_loss: 0.1242, reg_loss: 0.1236 ||: 69%|######9 | 66/95 [00:44<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9357, LAS: 0.8793, UEM: 0.5555, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5896, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8511, loss: 0.8060, batch_reg_loss: 0.1243, reg_loss: 0.1236 ||: 74%|#######3 | 70/95 [00:47<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9362, LAS: 0.8798, UEM: 0.5560, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7461, partial_loss/deprel_loss: 0.7575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8796, loss: 0.8015, batch_reg_loss: 0.1243, reg_loss: 0.1237 ||: 77%|#######6 | 73/95 [00:50<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9359, LAS: 0.8796, UEM: 0.5522, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1170, partial_loss/deprel_loss: 1.0188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1628, loss: 0.8031, batch_reg_loss: 0.1244, reg_loss: 0.1237 ||: 80%|######## | 76/95 
[00:52<00:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9371, LAS: 0.8808, UEM: 0.5712, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.7918, batch_reg_loss: 0.1245, reg_loss: 0.1237 ||: 83%|########3 | 79/95 [00:54<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7651, UAS: 0.9347, LAS: 0.8780, UEM: 0.5644, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1664, partial_loss/deprel_loss: 1.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7326, loss: 0.8152, batch_reg_loss: 0.1245, reg_loss: 0.1238 ||: 86%|########6 | 82/95 [00:56<00:09, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9344, LAS: 0.8776, UEM: 0.5591, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3251, partial_loss/deprel_loss: 0.5764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8192, batch_reg_loss: 0.1246, reg_loss: 0.1238 ||: 91%|######### | 86/95 [00:59<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8431, UAS: 0.9337, LAS: 0.8768, UEM: 0.5541, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9655, partial_loss/deprel_loss: 0.9398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0696, loss: 0.8243, batch_reg_loss: 0.1247, reg_loss: 0.1238 ||: 95%|#########4| 90/95 [01:02<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9334, LAS: 0.8764, UEM: 0.5476, LEM: 0.3011, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9685, partial_loss/deprel_loss: 0.8837, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0254, loss: 0.8279, batch_reg_loss: 0.1247, reg_loss: 0.1239 ||: 98%|#########7| 93/95 [01:04<00:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9338, LAS: 0.8769, UEM: 0.5566, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3800, loss: 0.8233, batch_reg_loss: 0.1248, reg_loss: 0.1239 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - reg_loss | 0.124 | N/A\n", + "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UEM | 0.557 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LEM | 0.312 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.139 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UAS | 0.934 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | 
N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.284 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - loss | 0.823 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LAS | 0.877 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:33:35,457 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:35,457 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:35,457 - INFO - combo.training.trainer - Epoch duration: 0:01:05.765487\n", + "2023-04-06 23:33:35,457 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:10\n", + "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - Epoch 39/399\n", + "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:33:35,465 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7854, UAS: 0.9013, LAS: 0.8406, UEM: 0.2256, LEM: 0.0677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9358, partial_loss/deprel_loss: 1.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.5643, loss: 1.1230, batch_reg_loss: 0.1249, reg_loss: 0.1248 ||: 3%|3 | 3/95 [00:02<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9146, LAS: 0.8558, UEM: 0.3082, LEM: 0.0959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4825, partial_loss/deprel_loss: 0.6405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7338, loss: 1.0103, batch_reg_loss: 0.1249, reg_loss: 0.1249 ||: 6%|6 | 6/95 [00:04<01:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9284, LAS: 0.8724, UEM: 0.5318, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2490, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.8735, batch_reg_loss: 0.1250, reg_loss: 0.1249 ||: 11%|# | 10/95 [00:07<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9343, LAS: 0.8784, UEM: 0.5593, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5965, partial_loss/deprel_loss: 0.7453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8407, loss: 0.8243, batch_reg_loss: 0.1251, reg_loss: 0.1249 ||: 14%|#3 | 13/95 [00:09<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9323, LAS: 0.8762, UEM: 0.5283, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6944, loss: 0.8411, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||: 17%|#6 | 16/95 [00:11<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9370, LAS: 0.8817, UEM: 
0.6207, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1209, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3726, loss: 0.7979, batch_reg_loss: 0.1252, reg_loss: 0.1250 ||: 20%|## | 19/95 [00:13<00:56, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9374, LAS: 0.8823, UEM: 0.6201, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0154, partial_loss/deprel_loss: 0.9240, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0676, loss: 0.7916, batch_reg_loss: 0.1253, reg_loss: 0.1250 ||: 23%|##3 | 22/95 [00:16<00:55, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9358, LAS: 0.8805, UEM: 0.6121, LEM: 0.3726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1837, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4560, loss: 0.8050, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||: 27%|##7 | 26/95 [00:18<00:50, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9380, LAS: 0.8832, UEM: 0.6298, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.7793, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||: 31%|### | 29/95 [00:21<00:54, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9364, LAS: 0.8817, UEM: 0.6136, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.4977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6073, loss: 0.7870, batch_reg_loss: 0.1254, reg_loss: 
0.1251 ||: 34%|###3 | 32/95 [00:23<00:49, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9369, LAS: 0.8820, UEM: 0.6008, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2908, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5950, loss: 0.7869, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||: 38%|###7 | 36/95 [00:26<00:44, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9359, LAS: 0.8805, UEM: 0.5898, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4490, partial_loss/deprel_loss: 0.5749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.7989, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||: 41%|####1 | 39/95 [00:28<00:40, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9365, LAS: 0.8817, UEM: 0.6143, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5383, partial_loss/deprel_loss: 0.6646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7650, loss: 0.7930, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||: 44%|####4 | 42/95 [00:31<00:41, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9361, LAS: 0.8814, UEM: 0.6079, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3776, partial_loss/deprel_loss: 0.5837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6681, loss: 0.7952, batch_reg_loss: 0.1257, reg_loss: 0.1253 ||: 47%|####7 | 45/95 [00:33<00:37, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9357, LAS: 0.8805, UEM: 0.5984, LEM: 0.3630, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3667, partial_loss/deprel_loss: 0.5887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6700, loss: 0.8030, batch_reg_loss: 0.1258, reg_loss: 0.1253 ||: 52%|#####1 | 49/95 [00:36<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9373, LAS: 0.8821, UEM: 0.6066, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2052, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4849, loss: 0.7901, batch_reg_loss: 0.1259, reg_loss: 0.1253 ||: 56%|#####5 | 53/95 [00:38<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9367, LAS: 0.8813, UEM: 0.5989, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.5433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6287, loss: 0.7944, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||: 59%|#####8 | 56/95 [00:40<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9367, LAS: 0.8811, UEM: 0.5948, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6581, partial_loss/deprel_loss: 0.7599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8655, loss: 0.7959, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||: 62%|######2 | 59/95 [00:42<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9377, LAS: 0.8821, UEM: 0.5973, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2486, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5335, loss: 0.7878, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||: 65%|######5 | 
62/95 [00:45<00:23, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9366, LAS: 0.8807, UEM: 0.5859, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7358, partial_loss/deprel_loss: 0.8422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.7992, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||: 68%|######8 | 65/95 [00:47<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9368, LAS: 0.8807, UEM: 0.5874, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2687, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5739, loss: 0.7989, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||: 73%|#######2 | 69/95 [00:49<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7954, UAS: 0.9347, LAS: 0.8782, UEM: 0.5760, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8442, partial_loss/deprel_loss: 1.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4556, loss: 0.8182, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||: 77%|#######6 | 73/95 [00:52<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9348, LAS: 0.8782, UEM: 0.5740, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1669, partial_loss/deprel_loss: 1.1540, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2829, loss: 0.8196, batch_reg_loss: 0.1263, reg_loss: 0.1256 ||: 80%|######## | 76/95 [00:54<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 
0.9344, LAS: 0.8778, UEM: 0.5651, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 0.7363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.8245, batch_reg_loss: 0.1264, reg_loss: 0.1256 ||: 84%|########4 | 80/95 [00:56<00:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9346, LAS: 0.8778, UEM: 0.5585, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.6359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8251, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||: 88%|########8 | 84/95 [00:59<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9349, LAS: 0.8780, UEM: 0.5571, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7289, partial_loss/deprel_loss: 0.8303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9366, loss: 0.8227, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||: 92%|#########1| 87/95 [01:01<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9353, LAS: 0.8782, UEM: 0.5545, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4038, partial_loss/deprel_loss: 0.5717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6647, loss: 0.8211, batch_reg_loss: 0.1266, reg_loss: 0.1257 ||: 96%|#########5| 91/95 [01:04<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9357, LAS: 0.8788, UEM: 0.5600, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3942, partial_loss/deprel_loss: 0.5844, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6730, loss: 0.8153, batch_reg_loss: 0.1267, reg_loss: 0.1257 ||: 99%|#########8| 94/95 [01:06<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7955, UAS: 0.9349, LAS: 0.8780, UEM: 0.5581, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7372, partial_loss/deprel_loss: 1.3056, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5186, loss: 0.8227, batch_reg_loss: 0.1267, reg_loss: 0.1258 ||: 100%|##########| 95/95 [01:07<00:00, 1.41it/s]\n", + "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer - reg_loss | 0.126 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UEM | 0.558 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LEM | 0.311 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EM | 0.795 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.737 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UAS | 0.935 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.306 | N/A\n", + "2023-04-06 
23:34:42,925 - INFO - combo.training.tensorboard_writer - loss | 0.823 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LAS | 0.878 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:42,926 - INFO - combo.training.trainer - Epoch duration: 0:01:07.468682\n", + "2023-04-06 23:34:42,926 - INFO - combo.training.trainer - Estimated training time remaining: 6:46:00\n", + "2023-04-06 23:34:42,926 - INFO - allennlp.training.trainer - Epoch 40/399\n", + "2023-04-06 23:34:42,927 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:34:42,927 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:34:42,933 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9400, LAS: 0.8828, UEM: 0.4868, LEM: 0.2070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6732, partial_loss/deprel_loss: 0.7949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8036, batch_reg_loss: 0.1268, reg_loss: 0.1267 ||: 4%|4 | 4/95 [00:02<00:51, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8732, UAS: 0.9421, LAS: 0.8870, UEM: 0.4658, LEM: 0.1947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6863, partial_loss/deprel_loss: 0.7191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8394, loss: 0.7717, batch_reg_loss: 0.1268, reg_loss: 0.1268 ||: 7%|7 | 7/95 [00:04<00:55, 1.59it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9476, LAS: 0.8928, UEM: 0.5637, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.4735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.7269, batch_reg_loss: 0.1269, reg_loss: 0.1268 ||: 11%|# | 10/95 [00:07<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9404, LAS: 0.8855, UEM: 0.5344, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3865, partial_loss/deprel_loss: 0.5412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6372, loss: 0.7765, batch_reg_loss: 0.1269, reg_loss: 0.1268 ||: 14%|#3 | 13/95 [00:09<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9422, LAS: 0.8870, UEM: 0.5699, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.3290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.7601, batch_reg_loss: 0.1270, reg_loss: 0.1268 ||: 17%|#6 | 16/95 [00:11<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9428, LAS: 0.8874, UEM: 0.5908, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 
0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.7553, batch_reg_loss: 0.1270, reg_loss: 0.1269 ||: 20%|## | 19/95 [00:13<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7986, UAS: 0.9376, LAS: 0.8821, UEM: 0.5716, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7296, partial_loss/deprel_loss: 1.2162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4460, loss: 0.8000, batch_reg_loss: 0.1271, reg_loss: 0.1269 ||: 24%|##4 | 23/95 [00:16<00:49, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9389, LAS: 0.8848, UEM: 0.6288, LEM: 0.3959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2579, partial_loss/deprel_loss: 0.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.7762, batch_reg_loss: 0.1272, reg_loss: 0.1269 ||: 27%|##7 | 26/95 [00:19<00:53, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9381, LAS: 0.8835, UEM: 0.6019, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6894, partial_loss/deprel_loss: 0.6837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8121, loss: 0.7863, batch_reg_loss: 0.1273, reg_loss: 0.1270 ||: 32%|###1 | 30/95 [00:21<00:47, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9404, LAS: 0.8862, UEM: 0.6130, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2661, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.7672, batch_reg_loss: 0.1273, reg_loss: 0.1270 ||: 35%|###4 | 33/95 [00:23<00:44, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9384, LAS: 0.8841, UEM: 0.5955, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6464, loss: 0.7814, batch_reg_loss: 0.1274, reg_loss: 0.1270 ||: 39%|###8 | 37/95 [00:26<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9361, LAS: 0.8813, UEM: 0.5781, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1116, partial_loss/deprel_loss: 0.9277, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0919, loss: 0.8044, batch_reg_loss: 0.1274, reg_loss: 0.1271 ||: 42%|####2 | 40/95 [00:28<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9349, LAS: 0.8800, UEM: 0.5685, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0994, partial_loss/deprel_loss: 0.9195, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0830, loss: 0.8124, batch_reg_loss: 0.1275, reg_loss: 0.1271 ||: 45%|####5 | 43/95 [00:31<00:38, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9339, LAS: 0.8786, UEM: 0.5597, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7561, partial_loss/deprel_loss: 0.8972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9965, loss: 0.8232, batch_reg_loss: 0.1275, reg_loss: 0.1271 ||: 48%|####8 | 46/95 [00:33<00:37, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9345, LAS: 0.8791, UEM: 0.5693, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.3585, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.4392, loss: 0.8194, batch_reg_loss: 0.1276, reg_loss: 0.1272 ||: 52%|#####1 | 49/95 [00:35<00:35, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9347, LAS: 0.8792, UEM: 0.5634, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3834, partial_loss/deprel_loss: 0.5559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6491, loss: 0.8214, batch_reg_loss: 0.1277, reg_loss: 0.1272 ||: 55%|#####4 | 52/95 [00:38<00:32, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9352, LAS: 0.8798, UEM: 0.5676, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4259, partial_loss/deprel_loss: 1.1430, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3273, loss: 0.8205, batch_reg_loss: 0.1277, reg_loss: 0.1272 ||: 58%|#####7 | 55/95 [00:40<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9358, LAS: 0.8805, UEM: 0.5735, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.4667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5406, loss: 0.8155, batch_reg_loss: 0.1278, reg_loss: 0.1272 ||: 61%|######1 | 58/95 [00:42<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9364, LAS: 0.8807, UEM: 0.5704, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6597, partial_loss/deprel_loss: 0.7953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8960, loss: 0.8129, batch_reg_loss: 0.1279, reg_loss: 0.1273 ||: 65%|######5 | 62/95 [00:44<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8891, UAS: 0.9368, LAS: 0.8811, UEM: 0.5682, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7439, loss: 0.8092, batch_reg_loss: 0.1279, reg_loss: 0.1273 ||: 68%|######8 | 65/95 [00:46<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7714, UAS: 0.9352, LAS: 0.8794, UEM: 0.5582, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2057, partial_loss/deprel_loss: 1.4002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6893, loss: 0.8228, batch_reg_loss: 0.1280, reg_loss: 0.1273 ||: 73%|#######2 | 69/95 [00:49<00:17, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9349, LAS: 0.8790, UEM: 0.5481, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9324, partial_loss/deprel_loss: 0.9164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0477, loss: 0.8266, batch_reg_loss: 0.1281, reg_loss: 0.1274 ||: 77%|#######6 | 73/95 [00:51<00:13, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9343, LAS: 0.8782, UEM: 0.5396, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4719, partial_loss/deprel_loss: 0.6551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.8310, batch_reg_loss: 0.1282, reg_loss: 0.1274 ||: 81%|########1 | 77/95 [00:54<00:11, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9355, LAS: 0.8795, UEM: 0.5530, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4529, partial_loss/deprel_loss: 0.6099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7067, loss: 0.8195, batch_reg_loss: 0.1283, reg_loss: 0.1275 ||: 85%|########5 | 81/95 [00:56<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9354, LAS: 0.8793, UEM: 0.5509, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4369, partial_loss/deprel_loss: 0.5590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.8217, batch_reg_loss: 0.1283, reg_loss: 0.1275 ||: 89%|########9 | 85/95 [00:59<00:06, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9360, LAS: 0.8801, UEM: 0.5586, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8639, partial_loss/deprel_loss: 0.7844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9288, loss: 0.8147, batch_reg_loss: 0.1284, reg_loss: 0.1275 ||: 94%|#########3| 89/95 [01:02<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.9354, LAS: 0.8793, UEM: 0.5562, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1743, partial_loss/deprel_loss: 0.9940, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1585, loss: 0.8192, batch_reg_loss: 0.1285, reg_loss: 0.1276 ||: 98%|#########7| 93/95 [01:04<00:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9352, LAS: 0.8793, UEM: 0.5649, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1439, partial_loss/deprel_loss: 0.2729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3757, loss: 0.8192, batch_reg_loss: 0.1285, reg_loss: 0.1276 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "2023-04-06 
23:35:48,999 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9453, LAS: 0.8944, UEM: 0.7057, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2201, partial_loss/deprel_loss: 22.8404, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3164, loss: 29.2944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9470, LAS: 0.8957, UEM: 0.6582, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 24.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7073, loss: 24.2815, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9471, LAS: 0.8932, UEM: 0.6188, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2938, partial_loss/deprel_loss: 28.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7890, loss: 26.0436, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9459, LAS: 0.8926, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 19.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9814, loss: 26.8978, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 
0.9459, LAS: 0.8926, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 19.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9814, loss: 26.8978, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02it/s]\n", + "2023-04-06 23:35:59,794 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - reg_loss | 0.128 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UEM | 0.565 | 0.667\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - LEM | 0.321 | 0.398\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EM | 0.936 | 0.937\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.144 | 0.219\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UAS | 0.935 | 0.946\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.273 | 19.922\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - loss | 0.819 | 26.898\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 
- INFO - combo.training.tensorboard_writer - LAS | 0.879 | 0.893\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:35:59,796 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:35:59,796 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:35:59,796 - INFO - combo.training.trainer - Epoch duration: 0:01:16.869728\n", + "2023-04-06 23:35:59,796 - INFO - combo.training.trainer - Estimated training time remaining: 6:46:13\n", + "2023-04-06 23:35:59,796 - INFO - allennlp.training.trainer - Epoch 41/399\n", + "2023-04-06 23:35:59,796 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:35:59,797 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:35:59,803 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9360, LAS: 0.8791, UEM: 0.4178, LEM: 0.1620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7190, partial_loss/deprel_loss: 0.8510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9532, loss: 0.8111, batch_reg_loss: 0.1286, reg_loss: 0.1286 ||: 3%|3 | 3/95 [00:02<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8220, UAS: 0.9273, LAS: 0.8723, UEM: 0.3843, LEM: 0.1462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3957, partial_loss/deprel_loss: 1.0064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2129, loss: 0.8524, batch_reg_loss: 0.1287, reg_loss: 0.1286 ||: 7%|7 | 7/95 [00:04<00:58, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9241, LAS: 0.8685, UEM: 0.3692, LEM: 0.1388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4538, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.8688, batch_reg_loss: 0.1287, reg_loss: 0.1286 ||: 12%|#1 | 11/95 [00:06<00:53, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9240, LAS: 0.8673, UEM: 0.3374, LEM: 0.1240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1968, partial_loss/deprel_loss: 0.8812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0732, loss: 0.8840, batch_reg_loss: 0.1288, reg_loss: 0.1287 ||: 16%|#5 | 15/95 [00:09<00:50, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9250, LAS: 0.8676, UEM: 0.3484, LEM: 0.1303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7812, partial_loss/deprel_loss: 0.8881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9956, loss: 0.8889, batch_reg_loss: 0.1289, reg_loss: 0.1287 ||: 19%|#8 | 18/95 [00:11<00:50, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8025, UAS: 0.9218, LAS: 0.8643, UEM: 0.3429, LEM: 0.1296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8468, partial_loss/deprel_loss: 1.1586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4252, loss: 0.9182, batch_reg_loss: 0.1289, reg_loss: 0.1287 ||: 22%|##2 | 21/95 [00:13<00:49, 1.49it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9241, LAS: 0.8671, UEM: 0.3746, LEM: 0.1478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4220, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6546, loss: 0.8955, batch_reg_loss: 0.1290, reg_loss: 0.1288 ||: 25%|##5 | 24/95 [00:16<00:50, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9262, LAS: 0.8692, UEM: 0.3980, LEM: 0.1641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2627, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5544, loss: 0.8827, batch_reg_loss: 0.1291, reg_loss: 0.1288 ||: 28%|##8 | 27/95 [00:18<00:47, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9284, LAS: 0.8709, UEM: 0.4256, LEM: 0.1786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0322, partial_loss/deprel_loss: 0.9060, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0604, loss: 0.8674, batch_reg_loss: 0.1292, reg_loss: 0.1288 ||: 33%|###2 | 31/95 [00:20<00:42, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9290, LAS: 0.8714, UEM: 0.4254, LEM: 0.1775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8132, partial_loss/deprel_loss: 0.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9964, loss: 0.8620, batch_reg_loss: 0.1292, reg_loss: 0.1289 ||: 36%|###5 | 34/95 [00:22<00:42, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9295, LAS: 0.8721, UEM: 0.4283, LEM: 0.1798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, 
partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8416, loss: 0.8553, batch_reg_loss: 0.1293, reg_loss: 0.1289 ||: 40%|#### | 38/95 [00:25<00:38, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9303, LAS: 0.8732, UEM: 0.4489, LEM: 0.2006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0398, partial_loss/deprel_loss: 0.9269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0788, loss: 0.8499, batch_reg_loss: 0.1294, reg_loss: 0.1289 ||: 43%|####3 | 41/95 [00:27<00:36, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9306, LAS: 0.8737, UEM: 0.4761, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.2568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3622, loss: 0.8484, batch_reg_loss: 0.1294, reg_loss: 0.1290 ||: 46%|####6 | 44/95 [00:29<00:36, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9313, LAS: 0.8745, UEM: 0.4715, LEM: 0.2310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5074, partial_loss/deprel_loss: 0.6380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7414, loss: 0.8422, batch_reg_loss: 0.1295, reg_loss: 0.1290 ||: 51%|##### | 48/95 [00:32<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9327, LAS: 0.8761, UEM: 0.4949, LEM: 0.2510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6366, partial_loss/deprel_loss: 0.7918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8903, loss: 0.8296, batch_reg_loss: 0.1295, reg_loss: 0.1290 ||: 54%|#####3 | 51/95 [00:34<00:31, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.9322, LAS: 0.8756, UEM: 0.4983, LEM: 0.2559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3103, partial_loss/deprel_loss: 1.1247, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2914, loss: 0.8344, batch_reg_loss: 0.1296, reg_loss: 0.1291 ||: 58%|#####7 | 55/95 [00:36<00:27, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7698, UAS: 0.9314, LAS: 0.8749, UEM: 0.5076, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0794, partial_loss/deprel_loss: 1.3318, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6110, loss: 0.8396, batch_reg_loss: 0.1297, reg_loss: 0.1291 ||: 61%|######1 | 58/95 [00:39<00:25, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9332, LAS: 0.8771, UEM: 0.5475, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4219, partial_loss/deprel_loss: 0.5777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6762, loss: 0.8229, batch_reg_loss: 0.1297, reg_loss: 0.1291 ||: 64%|######4 | 61/95 [00:41<00:25, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9341, LAS: 0.8781, UEM: 0.5496, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.8169, batch_reg_loss: 0.1298, reg_loss: 0.1292 ||: 67%|######7 | 64/95 [00:43<00:23, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9342, LAS: 0.8783, UEM: 0.5438, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4889, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8161, batch_reg_loss: 0.1298, reg_loss: 0.1292 ||: 71%|####### | 67/95 [00:46<00:20, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8365, UAS: 0.9343, LAS: 0.8784, UEM: 0.5427, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1633, partial_loss/deprel_loss: 1.0104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1708, loss: 0.8170, batch_reg_loss: 0.1299, reg_loss: 0.1292 ||: 74%|#######3 | 70/95 [00:48<00:18, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9327, LAS: 0.8766, UEM: 0.5300, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9013, partial_loss/deprel_loss: 0.9811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0951, loss: 0.8309, batch_reg_loss: 0.1300, reg_loss: 0.1293 ||: 78%|#######7 | 74/95 [00:50<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9333, LAS: 0.8771, UEM: 0.5329, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2841, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5919, loss: 0.8263, batch_reg_loss: 0.1300, reg_loss: 0.1293 ||: 81%|########1 | 77/95 [00:53<00:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9342, LAS: 0.8780, UEM: 0.5402, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.8205, batch_reg_loss: 0.1301, reg_loss: 0.1293 ||: 84%|########4 | 80/95 
[00:55<00:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9349, LAS: 0.8785, UEM: 0.5445, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3958, partial_loss/deprel_loss: 0.6372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.8184, batch_reg_loss: 0.1302, reg_loss: 0.1294 ||: 88%|########8 | 84/95 [00:57<00:07, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9345, LAS: 0.8780, UEM: 0.5462, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.5278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6132, loss: 0.8204, batch_reg_loss: 0.1302, reg_loss: 0.1294 ||: 92%|#########1| 87/95 [01:00<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9350, LAS: 0.8786, UEM: 0.5507, LEM: 0.3049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.8158, batch_reg_loss: 0.1303, reg_loss: 0.1294 ||: 95%|#########4| 90/95 [01:02<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9341, LAS: 0.8776, UEM: 0.5549, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1568, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.8229, batch_reg_loss: 0.1303, reg_loss: 0.1295 ||: 98%|#########7| 93/95 [01:04<00:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9344, LAS: 0.8780, UEM: 0.5592, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4078, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6911, loss: 0.8183, batch_reg_loss: 0.1304, reg_loss: 0.1295 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - reg_loss | 0.129 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UEM | 0.559 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - LEM | 0.315 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EM | 0.890 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.408 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UAS | 0.934 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.599 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - loss | 0.818 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - LAS | 0.878 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - 
combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:37:05,774 - INFO - combo.training.trainer - Epoch duration: 0:01:05.977443\n", + "2023-04-06 23:37:05,774 - INFO - combo.training.trainer - Estimated training time remaining: 6:44:49\n", + "2023-04-06 23:37:05,774 - INFO - allennlp.training.trainer - Epoch 42/399\n", + "2023-04-06 23:37:05,774 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:37:05,775 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:37:05,781 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9303, LAS: 0.8783, UEM: 0.6649, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.8148, batch_reg_loss: 0.1304, reg_loss: 0.1304 ||: 4%|4 | 4/95 [00:02<00:52, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9310, LAS: 0.8747, UEM: 0.5858, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5777, partial_loss/deprel_loss: 0.7217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8234, loss: 0.8341, batch_reg_loss: 0.1305, reg_loss: 0.1305 ||: 8%|8 | 8/95 
[00:04<00:49, 1.76it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8432, UAS: 0.9321, LAS: 0.8765, UEM: 0.5879, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9779, partial_loss/deprel_loss: 0.9717, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1036, loss: 0.8301, batch_reg_loss: 0.1306, reg_loss: 0.1305 ||: 13%|#2 | 12/95 [00:07<00:48, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9364, LAS: 0.8806, UEM: 0.6022, LEM: 0.3424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.7917, batch_reg_loss: 0.1307, reg_loss: 0.1305 ||: 17%|#6 | 16/95 [00:09<00:47, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9375, LAS: 0.8823, UEM: 0.5799, LEM: 0.3194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6576, loss: 0.7849, batch_reg_loss: 0.1307, reg_loss: 0.1306 ||: 21%|##1 | 20/95 [00:11<00:43, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9379, LAS: 0.8825, UEM: 0.5854, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1910, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.7820, batch_reg_loss: 0.1308, reg_loss: 0.1306 ||: 24%|##4 | 23/95 [00:13<00:43, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9385, LAS: 0.8835, UEM: 
0.5862, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6477, loss: 0.7759, batch_reg_loss: 0.1308, reg_loss: 0.1306 ||: 27%|##7 | 26/95 [00:15<00:43, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9382, LAS: 0.8834, UEM: 0.5912, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.7758, batch_reg_loss: 0.1309, reg_loss: 0.1306 ||: 31%|### | 29/95 [00:18<00:44, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9363, LAS: 0.8811, UEM: 0.5848, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.5942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6923, loss: 0.7947, batch_reg_loss: 0.1310, reg_loss: 0.1307 ||: 34%|###3 | 32/95 [00:20<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9350, LAS: 0.8798, UEM: 0.5674, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.8855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0096, loss: 0.8071, batch_reg_loss: 0.1310, reg_loss: 0.1307 ||: 37%|###6 | 35/95 [00:22<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9367, LAS: 0.8819, UEM: 0.5845, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3981, partial_loss/deprel_loss: 0.5429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.7921, batch_reg_loss: 0.1311, 
reg_loss: 0.1307 ||: 41%|####1 | 39/95 [00:24<00:37, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9352, LAS: 0.8802, UEM: 0.5727, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1738, partial_loss/deprel_loss: 0.9203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1022, loss: 0.8053, batch_reg_loss: 0.1312, reg_loss: 0.1308 ||: 45%|####5 | 43/95 [00:27<00:34, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9348, LAS: 0.8799, UEM: 0.5619, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6058, partial_loss/deprel_loss: 0.7052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8165, loss: 0.8099, batch_reg_loss: 0.1312, reg_loss: 0.1308 ||: 48%|####8 | 46/95 [00:29<00:33, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9329, LAS: 0.8774, UEM: 0.5492, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4213, partial_loss/deprel_loss: 0.5934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6902, loss: 0.8315, batch_reg_loss: 0.1313, reg_loss: 0.1308 ||: 53%|#####2 | 50/95 [00:32<00:30, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9343, LAS: 0.8790, UEM: 0.5635, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2668, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5067, loss: 0.8181, batch_reg_loss: 0.1314, reg_loss: 0.1309 ||: 56%|#####5 | 53/95 [00:34<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9334, LAS: 0.8781, UEM: 0.5632, LEM: 0.3101, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.5907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6931, loss: 0.8239, batch_reg_loss: 0.1314, reg_loss: 0.1309 ||: 59%|#####8 | 56/95 [00:36<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9340, LAS: 0.8785, UEM: 0.5642, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2055, partial_loss/deprel_loss: 0.3961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4895, loss: 0.8222, batch_reg_loss: 0.1315, reg_loss: 0.1309 ||: 62%|######2 | 59/95 [00:39<00:26, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9346, LAS: 0.8796, UEM: 0.5936, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0504, partial_loss/deprel_loss: 0.1567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2670, loss: 0.8129, batch_reg_loss: 0.1315, reg_loss: 0.1310 ||: 65%|######5 | 62/95 [00:41<00:25, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9339, LAS: 0.8788, UEM: 0.5859, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8858, partial_loss/deprel_loss: 0.8773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0106, loss: 0.8194, batch_reg_loss: 0.1316, reg_loss: 0.1310 ||: 69%|######9 | 66/95 [00:44<00:20, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9333, LAS: 0.8780, UEM: 0.5756, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6500, partial_loss/deprel_loss: 0.7221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8394, loss: 0.8262, batch_reg_loss: 0.1317, reg_loss: 0.1310 ||: 
74%|#######3 | 70/95 [00:46<00:17, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9338, LAS: 0.8782, UEM: 0.5723, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.8831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0087, loss: 0.8255, batch_reg_loss: 0.1318, reg_loss: 0.1311 ||: 78%|#######7 | 74/95 [00:48<00:13, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9341, LAS: 0.8784, UEM: 0.5675, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6659, loss: 0.8236, batch_reg_loss: 0.1319, reg_loss: 0.1311 ||: 82%|########2 | 78/95 [00:51<00:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9351, LAS: 0.8792, UEM: 0.5704, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.4452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5272, loss: 0.8173, batch_reg_loss: 0.1319, reg_loss: 0.1311 ||: 86%|########6 | 82/95 [00:54<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9355, LAS: 0.8796, UEM: 0.5687, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5372, loss: 0.8150, batch_reg_loss: 0.1320, reg_loss: 0.1312 ||: 91%|######### | 86/95 [00:57<00:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9088, UAS: 0.9360, LAS: 0.8801, UEM: 0.5755, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3179, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8097, batch_reg_loss: 0.1321, reg_loss: 0.1312 ||: 95%|#########4| 90/95 [01:00<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.9359, LAS: 0.8798, UEM: 0.5678, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7598, partial_loss/deprel_loss: 0.8543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9676, loss: 0.8136, batch_reg_loss: 0.1321, reg_loss: 0.1313 ||: 99%|#########8| 94/95 [01:02<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9355, LAS: 0.8793, UEM: 0.5654, LEM: 0.3171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3172, partial_loss/deprel_loss: 1.0476, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2337, loss: 0.8180, batch_reg_loss: 0.1322, reg_loss: 0.1313 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - reg_loss | 0.131 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UEM | 0.565 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - LEM | 0.317 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EM | 0.831 | 
N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.317 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UAS | 0.935 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.048 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - loss | 0.818 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - LAS | 0.879 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:09,337 - INFO - combo.training.trainer - Epoch duration: 0:01:03.562509\n", + "2023-04-06 23:38:09,337 - INFO - combo.training.trainer - Estimated training time remaining: 6:43:05\n", + "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - Epoch 43/399\n", + "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - GPU 0 
memory usage: 2.4G\n", + "2023-04-06 23:38:09,344 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9328, LAS: 0.8776, UEM: 0.5302, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2034, partial_loss/deprel_loss: 0.3875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.8172, batch_reg_loss: 0.1322, reg_loss: 0.1322 ||: 4%|4 | 4/95 [00:02<01:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9293, LAS: 0.8726, UEM: 0.5152, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5698, loss: 0.8541, batch_reg_loss: 0.1323, reg_loss: 0.1322 ||: 7%|7 | 7/95 [00:05<01:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9360, LAS: 0.8807, UEM: 0.5238, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4714, partial_loss/deprel_loss: 0.5702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6828, loss: 0.8027, batch_reg_loss: 0.1324, reg_loss: 0.1323 ||: 12%|#1 | 11/95 [00:07<00:58, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9424, LAS: 0.8876, UEM: 0.5878, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2110, partial_loss/deprel_loss: 0.4511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5355, loss: 0.7549, batch_reg_loss: 0.1325, reg_loss: 0.1323 ||: 16%|#5 | 15/95 [00:10<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 
0.9433, LAS: 0.8887, UEM: 0.5881, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.7440, batch_reg_loss: 0.1325, reg_loss: 0.1324 ||: 19%|#8 | 18/95 [00:12<00:56, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9392, LAS: 0.8839, UEM: 0.5833, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2968, partial_loss/deprel_loss: 0.4036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.7767, batch_reg_loss: 0.1326, reg_loss: 0.1324 ||: 23%|##3 | 22/95 [00:15<00:51, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9424, LAS: 0.8877, UEM: 0.6161, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3311, partial_loss/deprel_loss: 0.5547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6426, loss: 0.7507, batch_reg_loss: 0.1327, reg_loss: 0.1324 ||: 27%|##7 | 26/95 [00:18<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9437, LAS: 0.8891, UEM: 0.6301, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5761, loss: 0.7341, batch_reg_loss: 0.1327, reg_loss: 0.1325 ||: 31%|### | 29/95 [00:20<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9429, LAS: 0.8883, UEM: 0.6261, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7372, partial_loss/deprel_loss: 0.7821, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 0.7425, batch_reg_loss: 0.1328, reg_loss: 0.1325 ||: 35%|###4 | 33/95 [00:22<00:42, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.9407, LAS: 0.8858, UEM: 0.6095, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5700, partial_loss/deprel_loss: 1.0050, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2509, loss: 0.7631, batch_reg_loss: 0.1328, reg_loss: 0.1325 ||: 39%|###8 | 37/95 [00:25<00:38, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9395, LAS: 0.8842, UEM: 0.5960, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5814, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8719, loss: 0.7767, batch_reg_loss: 0.1329, reg_loss: 0.1326 ||: 42%|####2 | 40/95 [00:27<00:36, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9399, LAS: 0.8844, UEM: 0.5876, LEM: 0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6151, partial_loss/deprel_loss: 0.7105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8243, loss: 0.7740, batch_reg_loss: 0.1329, reg_loss: 0.1326 ||: 45%|####5 | 43/95 [00:29<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9370, LAS: 0.8810, UEM: 0.5682, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5969, partial_loss/deprel_loss: 0.7569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8579, loss: 0.7990, batch_reg_loss: 0.1330, reg_loss: 0.1326 ||: 49%|####9 | 47/95 [00:31<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9387, LAS: 0.8830, UEM: 0.5834, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.4182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5218, loss: 0.7847, batch_reg_loss: 0.1331, reg_loss: 0.1326 ||: 53%|#####2 | 50/95 [00:34<00:31, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9390, LAS: 0.8832, UEM: 0.5795, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6686, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8722, loss: 0.7829, batch_reg_loss: 0.1331, reg_loss: 0.1327 ||: 56%|#####5 | 53/95 [00:36<00:29, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9390, LAS: 0.8832, UEM: 0.5714, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4463, partial_loss/deprel_loss: 0.5824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6884, loss: 0.7834, batch_reg_loss: 0.1332, reg_loss: 0.1327 ||: 59%|#####8 | 56/95 [00:38<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9398, LAS: 0.8838, UEM: 0.5810, LEM: 0.3198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6588, loss: 0.7789, batch_reg_loss: 0.1333, reg_loss: 0.1327 ||: 62%|######2 | 59/95 [00:40<00:26, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9388, LAS: 0.8827, UEM: 0.5779, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1482, partial_loss/deprel_loss: 0.4166, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.4963, loss: 0.7892, batch_reg_loss: 0.1333, reg_loss: 0.1328 ||: 66%|######6 | 63/95 [00:43<00:22, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9391, LAS: 0.8832, UEM: 0.5753, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.5615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6668, loss: 0.7859, batch_reg_loss: 0.1334, reg_loss: 0.1328 ||: 69%|######9 | 66/95 [00:45<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9396, LAS: 0.8837, UEM: 0.5836, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1483, partial_loss/deprel_loss: 0.3676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4572, loss: 0.7803, batch_reg_loss: 0.1335, reg_loss: 0.1328 ||: 74%|#######3 | 70/95 [00:48<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7856, UAS: 0.9378, LAS: 0.8816, UEM: 0.5722, LEM: 0.3161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9450, partial_loss/deprel_loss: 1.2410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5154, loss: 0.7974, batch_reg_loss: 0.1335, reg_loss: 0.1329 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9365, LAS: 0.8803, UEM: 0.5662, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9895, partial_loss/deprel_loss: 0.9200, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0675, loss: 0.8079, batch_reg_loss: 0.1336, reg_loss: 0.1329 ||: 82%|########2 | 78/95 [00:53<00:11, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9533, UAS: 0.9369, LAS: 0.8808, UEM: 0.5785, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0708, partial_loss/deprel_loss: 0.1772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2896, loss: 0.8039, batch_reg_loss: 0.1337, reg_loss: 0.1329 ||: 86%|########6 | 82/95 [00:56<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9366, LAS: 0.8805, UEM: 0.5736, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1568, partial_loss/deprel_loss: 1.0099, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1730, loss: 0.8072, batch_reg_loss: 0.1338, reg_loss: 0.1330 ||: 89%|########9 | 85/95 [00:58<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9356, LAS: 0.8793, UEM: 0.5682, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4791, partial_loss/deprel_loss: 1.0106, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2382, loss: 0.8170, batch_reg_loss: 0.1338, reg_loss: 0.1330 ||: 94%|#########3| 89/95 [01:01<00:04, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9363, LAS: 0.8801, UEM: 0.5704, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6599, partial_loss/deprel_loss: 0.7541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8692, loss: 0.8104, batch_reg_loss: 0.1339, reg_loss: 0.1330 ||: 98%|#########7| 93/95 [01:03<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9361, LAS: 0.8797, UEM: 0.5673, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.0906, partial_loss/deprel_loss: 0.9511, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1129, loss: 0.8123, batch_reg_loss: 0.1340, reg_loss: 0.1331 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - reg_loss | 0.133 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - UEM | 0.567 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - LEM | 0.321 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EM | 0.836 | N/A\n", + "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.091 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.951 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - loss | 0.812 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - LAS | 0.880 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - 
combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:14,541 - INFO - combo.training.trainer - Epoch duration: 0:01:05.204106\n", + "2023-04-06 23:39:14,541 - INFO - combo.training.trainer - Estimated training time remaining: 6:41:37\n", + "2023-04-06 23:39:14,541 - INFO - allennlp.training.trainer - Epoch 44/399\n", + "2023-04-06 23:39:14,541 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:39:14,542 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:39:14,548 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9467, LAS: 0.8917, UEM: 0.4808, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7321, loss: 0.7410, batch_reg_loss: 0.1340, reg_loss: 0.1340 ||: 3%|3 | 3/95 [00:02<01:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9530, LAS: 0.8992, UEM: 0.5987, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1523, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4438, loss: 0.6830, batch_reg_loss: 0.1341, reg_loss: 0.1340 ||: 6%|6 | 6/95 
[00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9495, LAS: 0.8961, UEM: 0.5836, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5068, partial_loss/deprel_loss: 0.6826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7815, loss: 0.7073, batch_reg_loss: 0.1341, reg_loss: 0.1340 ||: 9%|9 | 9/95 [00:06<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9483, LAS: 0.8941, UEM: 0.5763, LEM: 0.2967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.5206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6077, loss: 0.7241, batch_reg_loss: 0.1342, reg_loss: 0.1341 ||: 14%|#3 | 13/95 [00:08<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9498, LAS: 0.8967, UEM: 0.5941, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.4274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7078, batch_reg_loss: 0.1342, reg_loss: 0.1341 ||: 17%|#6 | 16/95 [00:10<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9483, LAS: 0.8945, UEM: 0.5725, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6361, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7920, loss: 0.7192, batch_reg_loss: 0.1343, reg_loss: 0.1341 ||: 21%|##1 | 20/95 [00:13<00:48, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9460, LAS: 0.8921, UEM: 0.5715, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4193, partial_loss/deprel_loss: 0.6510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.7372, batch_reg_loss: 0.1344, reg_loss: 0.1342 ||: 24%|##4 | 23/95 [00:15<00:47, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9434, LAS: 0.8882, UEM: 0.5545, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2756, partial_loss/deprel_loss: 0.4521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.7633, batch_reg_loss: 0.1344, reg_loss: 0.1342 ||: 28%|##8 | 27/95 [00:17<00:43, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9439, LAS: 0.8889, UEM: 0.5700, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4635, partial_loss/deprel_loss: 0.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.7591, batch_reg_loss: 0.1345, reg_loss: 0.1342 ||: 33%|###2 | 31/95 [00:20<00:41, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9427, LAS: 0.8874, UEM: 0.5599, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5730, loss: 0.7653, batch_reg_loss: 0.1346, reg_loss: 0.1343 ||: 37%|###6 | 35/95 [00:23<00:40, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9389, LAS: 0.8834, UEM: 0.5573, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.4254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5128, loss: 0.7916, batch_reg_loss: 0.1347, reg_loss: 
0.1343 ||: 41%|####1 | 39/95 [00:25<00:36, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9398, LAS: 0.8849, UEM: 0.5937, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1354, partial_loss/deprel_loss: 0.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1411, loss: 0.7816, batch_reg_loss: 0.1347, reg_loss: 0.1343 ||: 44%|####4 | 42/95 [00:28<00:37, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9413, LAS: 0.8865, UEM: 0.6106, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1261, partial_loss/deprel_loss: 0.3357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4286, loss: 0.7688, batch_reg_loss: 0.1348, reg_loss: 0.1344 ||: 47%|####7 | 45/95 [00:30<00:36, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8616, UAS: 0.9401, LAS: 0.8851, UEM: 0.6033, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7775, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9043, loss: 0.7779, batch_reg_loss: 0.1348, reg_loss: 0.1344 ||: 51%|##### | 48/95 [00:32<00:34, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9393, LAS: 0.8844, UEM: 0.5934, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0858, partial_loss/deprel_loss: 0.9209, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0888, loss: 0.7858, batch_reg_loss: 0.1349, reg_loss: 0.1344 ||: 54%|#####3 | 51/95 [00:34<00:32, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9394, LAS: 0.8846, UEM: 0.5909, LEM: 0.3468, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.7819, batch_reg_loss: 0.1350, reg_loss: 0.1345 ||: 57%|#####6 | 54/95 [00:37<00:30, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9394, LAS: 0.8846, UEM: 0.5911, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4536, partial_loss/deprel_loss: 1.1444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3413, loss: 0.7833, batch_reg_loss: 0.1350, reg_loss: 0.1345 ||: 61%|######1 | 58/95 [00:39<00:25, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9399, LAS: 0.8851, UEM: 0.6075, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2542, partial_loss/deprel_loss: 0.4055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.7784, batch_reg_loss: 0.1351, reg_loss: 0.1345 ||: 64%|######4 | 61/95 [00:41<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9386, LAS: 0.8836, UEM: 0.6004, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0466, partial_loss/deprel_loss: 0.9946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1402, loss: 0.7893, batch_reg_loss: 0.1351, reg_loss: 0.1346 ||: 67%|######7 | 64/95 [00:44<00:22, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9380, LAS: 0.8827, UEM: 0.5919, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7341, partial_loss/deprel_loss: 0.8138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9330, loss: 0.7970, batch_reg_loss: 0.1352, reg_loss: 0.1346 ||: 
71%|####### | 67/95 [00:46<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9381, LAS: 0.8826, UEM: 0.5893, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1434, partial_loss/deprel_loss: 1.0298, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1878, loss: 0.7969, batch_reg_loss: 0.1353, reg_loss: 0.1346 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9379, LAS: 0.8824, UEM: 0.5830, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8588, partial_loss/deprel_loss: 0.8827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0132, loss: 0.7989, batch_reg_loss: 0.1353, reg_loss: 0.1346 ||: 78%|#######7 | 74/95 [00:50<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9370, LAS: 0.8813, UEM: 0.5752, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8835, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0087, loss: 0.8073, batch_reg_loss: 0.1354, reg_loss: 0.1347 ||: 81%|########1 | 77/95 [00:53<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9360, LAS: 0.8800, UEM: 0.5718, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7483, partial_loss/deprel_loss: 0.8180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9395, loss: 0.8174, batch_reg_loss: 0.1354, reg_loss: 0.1347 ||: 84%|########4 | 80/95 [00:55<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9362, LAS: 0.8801, UEM: 0.5681, LEM: 0.3248, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4420, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.8163, batch_reg_loss: 0.1355, reg_loss: 0.1347 ||: 87%|########7 | 83/95 [00:57<00:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9367, LAS: 0.8806, UEM: 0.5683, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6559, partial_loss/deprel_loss: 0.7691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8820, loss: 0.8131, batch_reg_loss: 0.1356, reg_loss: 0.1348 ||: 91%|######### | 86/95 [00:59<00:06, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9372, LAS: 0.8813, UEM: 0.5741, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2528, partial_loss/deprel_loss: 0.3779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8076, batch_reg_loss: 0.1356, reg_loss: 0.1348 ||: 94%|#########3| 89/95 [01:02<00:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9369, LAS: 0.8811, UEM: 0.5679, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4904, partial_loss/deprel_loss: 0.6834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7805, loss: 0.8105, batch_reg_loss: 0.1357, reg_loss: 0.1348 ||: 98%|#########7| 93/95 [01:04<00:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9364, LAS: 0.8805, UEM: 0.5661, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4135, partial_loss/deprel_loss: 0.5995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.8161, batch_reg_loss: 0.1357, reg_loss: 
0.1348 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer - reg_loss | 0.135 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UEM | 0.566 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LEM | 0.320 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EM | 0.896 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.413 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.599 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - loss | 0.816 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LAS | 0.880 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:40:20,625 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:40:20,625 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:40:20,625 - INFO - combo.training.trainer - Epoch duration: 0:01:06.084070\n", + "2023-04-06 23:40:20,625 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:17\n", + "2023-04-06 23:40:20,625 - INFO - allennlp.training.trainer - Epoch 45/399\n", + "2023-04-06 23:40:20,626 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:40:20,626 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:40:20,633 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9494, LAS: 0.8960, UEM: 0.6741, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.4747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5676, loss: 0.6745, batch_reg_loss: 0.1358, reg_loss: 0.1358 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9461, LAS: 0.8939, UEM: 0.6654, LEM: 0.4282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8130, partial_loss/deprel_loss: 0.8523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9803, loss: 0.7075, batch_reg_loss: 0.1359, reg_loss: 0.1358 ||: 6%|6 | 6/95 [00:04<01:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9039, UAS: 0.9465, LAS: 0.8949, UEM: 0.6410, LEM: 0.3850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 0.5640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7026, batch_reg_loss: 0.1359, reg_loss: 0.1358 ||: 9%|9 | 9/95 [00:07<01:05, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9419, LAS: 0.8882, UEM: 0.5945, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.7535, batch_reg_loss: 0.1360, reg_loss: 0.1359 ||: 14%|#3 | 13/95 [00:09<00:59, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9455, LAS: 0.8920, UEM: 0.6111, LEM: 0.3359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.7311, batch_reg_loss: 0.1361, reg_loss: 0.1359 ||: 18%|#7 | 17/95 [00:12<00:54, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9452, LAS: 0.8924, UEM: 0.6389, LEM: 0.4000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0746, partial_loss/deprel_loss: 0.2032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3136, loss: 0.7316, batch_reg_loss: 0.1361, reg_loss: 0.1360 ||: 22%|##2 | 21/95 [00:15<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9440, LAS: 0.8908, UEM: 0.6519, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1294, partial_loss/deprel_loss: 0.2705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3784, 
loss: 0.7436, batch_reg_loss: 0.1362, reg_loss: 0.1360 ||: 25%|##5 | 24/95 [00:17<00:50, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9409, LAS: 0.8871, UEM: 0.6308, LEM: 0.4006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.4021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.7703, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||: 29%|##9 | 28/95 [00:19<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8388, UAS: 0.9407, LAS: 0.8870, UEM: 0.6304, LEM: 0.3968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3034, partial_loss/deprel_loss: 1.0082, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2036, loss: 0.7726, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||: 33%|###2 | 31/95 [00:22<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9405, LAS: 0.8862, UEM: 0.6244, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0059, partial_loss/deprel_loss: 0.9191, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0729, loss: 0.7778, batch_reg_loss: 0.1364, reg_loss: 0.1361 ||: 37%|###6 | 35/95 [00:24<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9416, LAS: 0.8876, UEM: 0.6220, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2988, partial_loss/deprel_loss: 0.4795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.7673, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||: 41%|####1 | 39/95 [00:27<00:39, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9422, LAS: 0.8883, 
UEM: 0.6175, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2808, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.7585, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||: 45%|####5 | 43/95 [00:30<00:36, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9432, LAS: 0.8891, UEM: 0.6218, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6001, loss: 0.7497, batch_reg_loss: 0.1366, reg_loss: 0.1362 ||: 48%|####8 | 46/95 [00:32<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9402, LAS: 0.8859, UEM: 0.6066, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1341, partial_loss/deprel_loss: 0.9265, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1047, loss: 0.7741, batch_reg_loss: 0.1366, reg_loss: 0.1362 ||: 53%|#####2 | 50/95 [00:35<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9400, LAS: 0.8856, UEM: 0.6022, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1163, partial_loss/deprel_loss: 0.9497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1197, loss: 0.7758, batch_reg_loss: 0.1367, reg_loss: 0.1362 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9403, LAS: 0.8859, UEM: 0.5938, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.5982, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7146, loss: 0.7762, batch_reg_loss: 0.1368, reg_loss: 0.1363 ||: 60%|###### | 57/95 [00:39<00:25, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9383, LAS: 0.8835, UEM: 0.5834, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4552, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.7948, batch_reg_loss: 0.1368, reg_loss: 0.1363 ||: 64%|######4 | 61/95 [00:42<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9387, LAS: 0.8840, UEM: 0.5977, LEM: 0.3522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1554, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4515, loss: 0.7900, batch_reg_loss: 0.1369, reg_loss: 0.1363 ||: 68%|######8 | 65/95 [00:45<00:20, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9384, LAS: 0.8836, UEM: 0.5927, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2767, partial_loss/deprel_loss: 0.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.7931, batch_reg_loss: 0.1370, reg_loss: 0.1364 ||: 73%|#######2 | 69/95 [00:47<00:17, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9378, LAS: 0.8831, UEM: 0.5895, LEM: 0.3445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.5303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.7963, batch_reg_loss: 0.1371, reg_loss: 0.1364 ||: 76%|#######5 | 72/95 [00:50<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9361, LAS: 0.8812, UEM: 0.5811, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6207, partial_loss/deprel_loss: 0.7086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8281, loss: 0.8108, batch_reg_loss: 0.1371, reg_loss: 0.1364 ||: 79%|#######8 | 75/95 [00:52<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9360, LAS: 0.8810, UEM: 0.5781, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.8120, batch_reg_loss: 0.1372, reg_loss: 0.1365 ||: 83%|########3 | 79/95 [00:54<00:10, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9366, LAS: 0.8815, UEM: 0.5757, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4516, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7467, loss: 0.8091, batch_reg_loss: 0.1373, reg_loss: 0.1365 ||: 87%|########7 | 83/95 [00:57<00:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9357, LAS: 0.8802, UEM: 0.5671, LEM: 0.3249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8374, partial_loss/deprel_loss: 0.8827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0110, loss: 0.8188, batch_reg_loss: 0.1374, reg_loss: 0.1365 ||: 91%|######### | 86/95 [01:00<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9362, LAS: 0.8807, UEM: 0.5675, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 
0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6649, loss: 0.8156, batch_reg_loss: 0.1374, reg_loss: 0.1366 ||: 94%|#########3| 89/95 [01:02<00:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9362, LAS: 0.8807, UEM: 0.5685, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9220, partial_loss/deprel_loss: 0.8461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9988, loss: 0.8153, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||: 97%|#########6| 92/95 [01:04<00:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9362, LAS: 0.8807, UEM: 0.5664, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4165, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6799, loss: 0.8159, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||: 100%|##########| 95/95 [01:06<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9362, LAS: 0.8807, UEM: 0.5664, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4165, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6799, loss: 0.8159, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-06 23:41:27,404 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9165, LAS: 0.8550, UEM: 0.1988, LEM: 0.0361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8586, partial_loss/deprel_loss: 44.4118, partial_loss/cycle_loss: 0.0000, batch_loss: 35.7012, loss: 41.2754, batch_reg_loss: 0.0000, 
reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9456, LAS: 0.8943, UEM: 0.7281, LEM: 0.4981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2232, partial_loss/deprel_loss: 22.5852, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1128, loss: 27.1635, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9451, LAS: 0.8918, UEM: 0.6742, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 33.8063, partial_loss/cycle_loss: 0.0000, batch_loss: 27.2165, loss: 28.1215, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:08<00:03, 1.01s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9469, LAS: 0.8927, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 24.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3482, loss: 26.4357, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9469, LAS: 0.8927, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 24.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3482, loss: 26.4357, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.05it/s]\n", + "2023-04-06 23:41:37,888 - INFO - combo.training.tensorboard_writer - 
Training | Validation\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - reg_loss | 0.137 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UEM | 0.566 | 0.667\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - LEM | 0.322 | 0.398\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EM | 0.906 | 0.915\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.416 | 0.362\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | 0.947\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.574 | 24.095\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - loss | 0.816 | 26.436\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - LAS | 0.881 | 0.893\n", + "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:41:37,890 - 
INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:41:37,891 - INFO - combo.training.trainer - Epoch duration: 0:01:17.265210\n", + "2023-04-06 23:41:37,891 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:23\n", + "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - Epoch 46/399\n", + "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:41:37,898 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9384, LAS: 0.8818, UEM: 0.3734, LEM: 0.1384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8249, partial_loss/deprel_loss: 0.9382, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0532, loss: 0.8264, batch_reg_loss: 0.1376, reg_loss: 0.1376 ||: 3%|3 | 3/95 [00:02<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9417, LAS: 0.8873, UEM: 0.4747, LEM: 0.2218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6840, partial_loss/deprel_loss: 0.7449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8704, loss: 0.7841, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9425, LAS: 0.8875, UEM: 0.4812, LEM: 0.2071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3713, 
partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6839, loss: 0.7722, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||: 11%|# | 10/95 [00:06<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8354, UAS: 0.9372, LAS: 0.8831, UEM: 0.4905, LEM: 0.2360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3465, partial_loss/deprel_loss: 0.9104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1354, loss: 0.7935, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||: 15%|#4 | 14/95 [00:09<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9297, LAS: 0.8741, UEM: 0.4456, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1434, partial_loss/deprel_loss: 0.9181, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1010, loss: 0.8644, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||: 19%|#8 | 18/95 [00:11<00:49, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9280, LAS: 0.8725, UEM: 0.4833, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3145, partial_loss/deprel_loss: 1.0498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2407, loss: 0.8758, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||: 22%|##2 | 21/95 [00:13<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9286, LAS: 0.8732, UEM: 0.4933, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5604, loss: 0.8730, batch_reg_loss: 0.1380, reg_loss: 0.1378 ||: 25%|##5 | 24/95 [00:17<01:01, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8390, UAS: 0.9300, LAS: 0.8744, UEM: 0.4931, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1832, partial_loss/deprel_loss: 0.9521, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1364, loss: 0.8631, batch_reg_loss: 0.1381, reg_loss: 0.1378 ||: 29%|##9 | 28/95 [00:20<00:53, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9325, LAS: 0.8773, UEM: 0.5136, LEM: 0.2703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3778, partial_loss/deprel_loss: 0.5454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6501, loss: 0.8409, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||: 34%|###3 | 32/95 [00:22<00:47, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9315, LAS: 0.8762, UEM: 0.5065, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0980, partial_loss/deprel_loss: 0.9244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0973, loss: 0.8481, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||: 37%|###6 | 35/95 [00:25<00:43, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8415, UAS: 0.9277, LAS: 0.8720, UEM: 0.4886, LEM: 0.2554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 0.8297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9971, loss: 0.8780, batch_reg_loss: 0.1383, reg_loss: 0.1379 ||: 40%|#### | 38/95 [00:27<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9306, LAS: 0.8754, UEM: 0.5315, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1455, partial_loss/deprel_loss: 0.3835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.8522, batch_reg_loss: 0.1384, reg_loss: 0.1379 ||: 43%|####3 | 41/95 [00:29<00:40, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9326, LAS: 0.8776, UEM: 0.5548, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6045, loss: 0.8329, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||: 46%|####6 | 44/95 [00:32<00:39, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9335, LAS: 0.8787, UEM: 0.5579, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2463, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5704, loss: 0.8267, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||: 49%|####9 | 47/95 [00:34<00:37, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9340, LAS: 0.8793, UEM: 0.5501, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4458, partial_loss/deprel_loss: 0.5934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7024, loss: 0.8208, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||: 53%|#####2 | 50/95 [00:36<00:34, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9337, LAS: 0.8787, UEM: 0.5367, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9964, partial_loss/deprel_loss: 0.8618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0273, loss: 0.8244, batch_reg_loss: 0.1386, reg_loss: 0.1381 ||: 57%|#####6 | 54/95 [00:39<00:29, 1.38it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9349, LAS: 0.8801, UEM: 0.5640, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3095, loss: 0.8150, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||: 60%|###### | 57/95 [00:41<00:28, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9348, LAS: 0.8798, UEM: 0.5555, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9198, partial_loss/deprel_loss: 0.8242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9821, loss: 0.8174, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||: 64%|######4 | 61/95 [00:44<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9352, LAS: 0.8805, UEM: 0.5606, LEM: 0.3220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5460, loss: 0.8125, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||: 67%|######7 | 64/95 [00:46<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9360, LAS: 0.8814, UEM: 0.5732, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4190, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6808, loss: 0.8043, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||: 71%|####### | 67/95 [00:48<00:21, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9370, LAS: 0.8826, UEM: 0.5785, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5879, loss: 0.7951, batch_reg_loss: 0.1389, reg_loss: 0.1382 ||: 74%|#######3 | 70/95 [00:50<00:18, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9369, LAS: 0.8826, UEM: 0.5706, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6230, partial_loss/deprel_loss: 0.6653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7957, loss: 0.7966, batch_reg_loss: 0.1389, reg_loss: 0.1383 ||: 78%|#######7 | 74/95 [00:53<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9375, LAS: 0.8832, UEM: 0.5774, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4835, partial_loss/deprel_loss: 0.6329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7420, loss: 0.7910, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||: 81%|########1 | 77/95 [00:55<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9379, LAS: 0.8836, UEM: 0.5761, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4014, partial_loss/deprel_loss: 0.5538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7882, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||: 84%|########4 | 80/95 [00:58<00:11, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9377, LAS: 0.8832, UEM: 0.5691, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7767, loss: 0.7916, batch_reg_loss: 0.1391, reg_loss: 0.1383 ||: 87%|########7 | 83/95 [01:00<00:08, 
1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9374, LAS: 0.8828, UEM: 0.5665, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4622, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 0.7948, batch_reg_loss: 0.1391, reg_loss: 0.1384 ||: 91%|######### | 86/95 [01:02<00:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9382, LAS: 0.8835, UEM: 0.5720, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.7901, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||: 95%|#########4| 90/95 [01:04<00:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9367, LAS: 0.8818, UEM: 0.5672, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5604, partial_loss/deprel_loss: 0.7168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8248, loss: 0.8043, batch_reg_loss: 0.1393, reg_loss: 0.1384 ||: 98%|#########7| 93/95 [01:07<00:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8415, UAS: 0.9359, LAS: 0.8809, UEM: 0.5622, LEM: 0.3202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0151, partial_loss/deprel_loss: 0.9374, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0923, loss: 0.8117, batch_reg_loss: 0.1393, reg_loss: 0.1385 ||: 100%|##########| 95/95 [01:08<00:00, 1.39it/s]\n", + "2023-04-06 23:42:46,421 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:42:46,421 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + 
"2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - reg_loss | 0.138 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UEM | 0.562 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - LEM | 0.320 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EM | 0.841 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.015 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.937 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - loss | 0.812 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - LAS | 0.881 | N/A\n", + "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:46,423 - INFO - combo.training.trainer - Epoch duration: 0:01:08.532568\n", + "2023-04-06 23:42:46,424 - INFO - combo.training.trainer - Estimated training time remaining: 6:39:20\n", + "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - Epoch 47/399\n", + "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:42:46,431 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9575, LAS: 0.9058, UEM: 0.6646, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2918, partial_loss/deprel_loss: 0.5193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6131, loss: 0.6360, batch_reg_loss: 0.1394, reg_loss: 0.1393 ||: 4%|4 | 4/95 [00:02<00:59, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9441, LAS: 0.8906, UEM: 0.5665, LEM: 0.2927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7484, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8196, loss: 0.7513, batch_reg_loss: 0.1394, reg_loss: 0.1394 ||: 7%|7 | 7/95 [00:04<00:59, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9357, LAS: 0.8795, UEM: 0.5114, LEM: 0.2450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7294, partial_loss/deprel_loss: 0.8087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9323, loss: 0.8303, 
batch_reg_loss: 0.1395, reg_loss: 0.1394 ||: 11%|# | 10/95 [00:06<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9358, LAS: 0.8801, UEM: 0.5003, LEM: 0.2286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.5388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6632, loss: 0.8273, batch_reg_loss: 0.1396, reg_loss: 0.1394 ||: 15%|#4 | 14/95 [00:09<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9353, LAS: 0.8802, UEM: 0.5093, LEM: 0.2462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9208, partial_loss/deprel_loss: 0.8924, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0377, loss: 0.8179, batch_reg_loss: 0.1396, reg_loss: 0.1395 ||: 18%|#7 | 17/95 [00:11<00:52, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9352, LAS: 0.8805, UEM: 0.5340, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1473, partial_loss/deprel_loss: 0.3474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.8197, batch_reg_loss: 0.1397, reg_loss: 0.1395 ||: 21%|##1 | 20/95 [00:13<00:50, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9339, LAS: 0.8791, UEM: 0.5085, LEM: 0.2634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6413, partial_loss/deprel_loss: 0.7258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8486, loss: 0.8335, batch_reg_loss: 0.1397, reg_loss: 0.1395 ||: 24%|##4 | 23/95 [00:15<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9361, LAS: 0.8817, UEM: 0.5197, LEM: 
0.2742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.8120, batch_reg_loss: 0.1398, reg_loss: 0.1396 ||: 28%|##8 | 27/95 [00:17<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9333, LAS: 0.8783, UEM: 0.5124, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2833, partial_loss/deprel_loss: 0.4738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5756, loss: 0.8371, batch_reg_loss: 0.1399, reg_loss: 0.1396 ||: 33%|###2 | 31/95 [00:20<00:42, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9354, LAS: 0.8807, UEM: 0.5301, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3344, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6285, loss: 0.8172, batch_reg_loss: 0.1400, reg_loss: 0.1396 ||: 36%|###5 | 34/95 [00:22<00:40, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9624, UAS: 0.9366, LAS: 0.8821, UEM: 0.5833, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0444, partial_loss/deprel_loss: 0.1539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2721, loss: 0.8122, batch_reg_loss: 0.1400, reg_loss: 0.1397 ||: 40%|#### | 38/95 [00:25<00:39, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9361, LAS: 0.8817, UEM: 0.5872, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7777, loss: 0.8153, batch_reg_loss: 0.1401, reg_loss: 0.1397 
||: 43%|####3 | 41/95 [00:27<00:38, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9361, LAS: 0.8814, UEM: 0.5756, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.6801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8021, loss: 0.8151, batch_reg_loss: 0.1401, reg_loss: 0.1397 ||: 46%|####6 | 44/95 [00:30<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9373, LAS: 0.8827, UEM: 0.5772, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4436, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6934, loss: 0.8048, batch_reg_loss: 0.1402, reg_loss: 0.1398 ||: 49%|####9 | 47/95 [00:32<00:34, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9379, LAS: 0.8836, UEM: 0.5798, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9289, partial_loss/deprel_loss: 0.8450, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0020, loss: 0.7981, batch_reg_loss: 0.1403, reg_loss: 0.1398 ||: 53%|#####2 | 50/95 [00:34<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9365, LAS: 0.8819, UEM: 0.5754, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.6077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6992, loss: 0.8102, batch_reg_loss: 0.1403, reg_loss: 0.1398 ||: 57%|#####6 | 54/95 [00:37<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9375, LAS: 0.8828, UEM: 0.5777, LEM: 0.3257, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3133, partial_loss/deprel_loss: 0.5667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6564, loss: 0.8034, batch_reg_loss: 0.1404, reg_loss: 0.1399 ||: 60%|###### | 57/95 [00:39<00:27, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9369, LAS: 0.8822, UEM: 0.5702, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8833, partial_loss/deprel_loss: 0.8060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9619, loss: 0.8088, batch_reg_loss: 0.1404, reg_loss: 0.1399 ||: 63%|######3 | 60/95 [00:41<00:25, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9369, LAS: 0.8819, UEM: 0.5634, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5471, partial_loss/deprel_loss: 0.8084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8966, loss: 0.8110, batch_reg_loss: 0.1405, reg_loss: 0.1399 ||: 66%|######6 | 63/95 [00:43<00:23, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9372, LAS: 0.8823, UEM: 0.5600, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5296, partial_loss/deprel_loss: 0.6012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7274, loss: 0.8069, batch_reg_loss: 0.1405, reg_loss: 0.1399 ||: 71%|####### | 67/95 [00:46<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9369, LAS: 0.8821, UEM: 0.5693, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4940, partial_loss/deprel_loss: 0.6594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7669, 
loss: 0.8081, batch_reg_loss: 0.1406, reg_loss: 0.1400 ||: 74%|#######3 | 70/95 [00:48<00:17, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9382, LAS: 0.8836, UEM: 0.5848, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1530, partial_loss/deprel_loss: 0.3817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4766, loss: 0.7969, batch_reg_loss: 0.1407, reg_loss: 0.1400 ||: 77%|#######6 | 73/95 [00:51<00:16, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9379, LAS: 0.8833, UEM: 0.5780, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2605, partial_loss/deprel_loss: 1.0438, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2278, loss: 0.7990, batch_reg_loss: 0.1407, reg_loss: 0.1400 ||: 81%|########1 | 77/95 [00:53<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9381, LAS: 0.8834, UEM: 0.5851, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2065, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5310, loss: 0.7956, batch_reg_loss: 0.1408, reg_loss: 0.1401 ||: 84%|########4 | 80/95 [00:55<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9380, LAS: 0.8832, UEM: 0.5787, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3494, partial_loss/deprel_loss: 0.4998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6105, loss: 0.7982, batch_reg_loss: 0.1408, reg_loss: 0.1401 ||: 88%|########8 | 84/95 [00:57<00:07, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, 
UAS: 0.9373, LAS: 0.8823, UEM: 0.5795, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1643, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.8058, batch_reg_loss: 0.1409, reg_loss: 0.1401 ||: 93%|#########2| 88/95 [01:00<00:04, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9373, LAS: 0.8821, UEM: 0.5728, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5563, partial_loss/deprel_loss: 0.6610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7810, loss: 0.8073, batch_reg_loss: 0.1410, reg_loss: 0.1402 ||: 97%|#########6| 92/95 [01:02<00:01, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9364, LAS: 0.8810, UEM: 0.5686, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6867, loss: 0.8150, batch_reg_loss: 0.1410, reg_loss: 0.1402 ||: 100%|##########| 95/95 [01:03<00:00, 1.48it/s]\n", + "2023-04-06 23:43:50,414 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - reg_loss | 0.140 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UEM | 0.569 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LEM | 0.322 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EM | 0.890 | N/A\n", + 
"2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.371 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.589 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - loss | 0.815 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LAS | 0.881 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:43:50,416 - INFO - combo.training.trainer - Epoch duration: 0:01:03.992550\n", + "2023-04-06 23:43:50,416 - INFO - combo.training.trainer - Estimated training time remaining: 6:37:44\n", + "2023-04-06 23:43:50,416 - INFO - allennlp.training.trainer - Epoch 48/399\n", + "2023-04-06 23:43:50,416 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:43:50,417 - INFO - allennlp.training.trainer - GPU 0 memory usage: 
2.4G\n", + "2023-04-06 23:43:50,430 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9246, LAS: 0.8706, UEM: 0.3107, LEM: 0.1247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4508, partial_loss/deprel_loss: 0.6146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7229, loss: 0.8960, batch_reg_loss: 0.1411, reg_loss: 0.1411 ||: 4%|4 | 4/95 [00:02<00:53, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9396, LAS: 0.8903, UEM: 0.6835, LEM: 0.5249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0651, partial_loss/deprel_loss: 0.1912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3071, loss: 0.7490, batch_reg_loss: 0.1411, reg_loss: 0.1411 ||: 6%|6 | 6/95 [00:04<01:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9430, LAS: 0.8921, UEM: 0.6491, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.7309, batch_reg_loss: 0.1412, reg_loss: 0.1411 ||: 9%|9 | 9/95 [00:06<01:04, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9407, LAS: 0.8877, UEM: 0.6194, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0302, partial_loss/deprel_loss: 0.9679, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1216, loss: 0.7598, batch_reg_loss: 0.1412, reg_loss: 0.1411 ||: 13%|#2 | 12/95 [00:09<01:01, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9411, LAS: 0.8879, UEM: 0.6232, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2766, partial_loss/deprel_loss: 0.4543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.7571, batch_reg_loss: 0.1413, reg_loss: 0.1412 ||: 16%|#5 | 15/95 [00:11<01:00, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9362, LAS: 0.8814, UEM: 0.5813, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5272, partial_loss/deprel_loss: 0.6339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8038, batch_reg_loss: 0.1414, reg_loss: 0.1412 ||: 20%|## | 19/95 [00:13<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9384, LAS: 0.8840, UEM: 0.5813, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6809, partial_loss/deprel_loss: 0.7209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8544, loss: 0.7911, batch_reg_loss: 0.1414, reg_loss: 0.1412 ||: 23%|##3 | 22/95 [00:15<00:51, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9348, LAS: 0.8805, UEM: 0.5621, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5691, partial_loss/deprel_loss: 0.7029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8176, loss: 0.8155, batch_reg_loss: 0.1415, reg_loss: 0.1413 ||: 27%|##7 | 26/95 [00:18<00:48, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9332, LAS: 0.8784, UEM: 0.5724, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4915, partial_loss/deprel_loss: 0.6467, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7572, loss: 0.8279, batch_reg_loss: 0.1416, reg_loss: 0.1413 ||: 31%|### | 29/95 [00:20<00:47, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9330, LAS: 0.8774, UEM: 0.5595, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6215, partial_loss/deprel_loss: 0.8165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9192, loss: 0.8350, batch_reg_loss: 0.1416, reg_loss: 0.1413 ||: 34%|###3 | 32/95 [00:22<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9348, LAS: 0.8798, UEM: 0.5804, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7149, partial_loss/deprel_loss: 0.8073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9305, loss: 0.8176, batch_reg_loss: 0.1417, reg_loss: 0.1414 ||: 37%|###6 | 35/95 [00:25<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8580, UAS: 0.9340, LAS: 0.8788, UEM: 0.5589, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0087, partial_loss/deprel_loss: 0.8536, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0264, loss: 0.8281, batch_reg_loss: 0.1418, reg_loss: 0.1414 ||: 41%|####1 | 39/95 [00:27<00:37, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9362, LAS: 0.8813, UEM: 0.5820, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.8080, batch_reg_loss: 0.1418, reg_loss: 0.1414 ||: 44%|####4 | 42/95 [00:29<00:36, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9346, LAS: 0.8795, UEM: 0.5668, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3684, partial_loss/deprel_loss: 0.9809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2003, loss: 0.8222, batch_reg_loss: 0.1419, reg_loss: 0.1415 ||: 48%|####8 | 46/95 [00:32<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8141, UAS: 0.9333, LAS: 0.8780, UEM: 0.5536, LEM: 0.3186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3576, partial_loss/deprel_loss: 0.9825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1995, loss: 0.8312, batch_reg_loss: 0.1420, reg_loss: 0.1415 ||: 53%|#####2 | 50/95 [00:34<00:29, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9332, LAS: 0.8779, UEM: 0.5417, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9766, partial_loss/deprel_loss: 0.8796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0411, loss: 0.8334, batch_reg_loss: 0.1420, reg_loss: 0.1415 ||: 57%|#####6 | 54/95 [00:37<00:26, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9322, LAS: 0.8768, UEM: 0.5268, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7397, partial_loss/deprel_loss: 0.7262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 0.8443, batch_reg_loss: 0.1421, reg_loss: 0.1416 ||: 61%|######1 | 58/95 [00:39<00:23, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9325, LAS: 0.8768, UEM: 0.5299, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9624, partial_loss/deprel_loss: 0.8780, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.0370, loss: 0.8424, batch_reg_loss: 0.1422, reg_loss: 0.1416 ||: 65%|######5 | 62/95 [00:42<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9343, LAS: 0.8788, UEM: 0.5502, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.8254, batch_reg_loss: 0.1423, reg_loss: 0.1417 ||: 69%|######9 | 66/95 [00:45<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9346, LAS: 0.8791, UEM: 0.5491, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9794, partial_loss/deprel_loss: 0.8978, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0565, loss: 0.8239, batch_reg_loss: 0.1424, reg_loss: 0.1417 ||: 74%|#######3 | 70/95 [00:47<00:16, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9351, LAS: 0.8797, UEM: 0.5488, LEM: 0.3082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6549, partial_loss/deprel_loss: 0.6211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7703, loss: 0.8183, batch_reg_loss: 0.1424, reg_loss: 0.1417 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9350, LAS: 0.8797, UEM: 0.5482, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3373, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6150, loss: 0.8187, batch_reg_loss: 0.1425, reg_loss: 0.1418 ||: 81%|########1 | 77/95 [00:53<00:12, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9360, LAS: 0.8810, UEM: 0.5638, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1284, partial_loss/deprel_loss: 0.2522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3700, loss: 0.8082, batch_reg_loss: 0.1425, reg_loss: 0.1418 ||: 84%|########4 | 80/95 [00:55<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9360, LAS: 0.8809, UEM: 0.5696, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1299, partial_loss/deprel_loss: 0.3227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4267, loss: 0.8099, batch_reg_loss: 0.1426, reg_loss: 0.1418 ||: 87%|########7 | 83/95 [00:57<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9364, LAS: 0.8812, UEM: 0.5652, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5604, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7781, loss: 0.8085, batch_reg_loss: 0.1426, reg_loss: 0.1419 ||: 92%|#########1| 87/95 [00:59<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9360, LAS: 0.8808, UEM: 0.5644, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1008, partial_loss/deprel_loss: 0.9605, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1313, loss: 0.8109, batch_reg_loss: 0.1427, reg_loss: 0.1419 ||: 95%|#########4| 90/95 [01:02<00:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9366, LAS: 0.8813, UEM: 0.5658, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7521, partial_loss/deprel_loss: 0.8806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9976, loss: 0.8087, batch_reg_loss: 0.1428, reg_loss: 0.1419 ||: 99%|#########8| 94/95 [01:04<00:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9362, LAS: 0.8809, UEM: 0.5632, LEM: 0.3208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0050, partial_loss/deprel_loss: 0.9152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0759, loss: 0.8115, batch_reg_loss: 0.1428, reg_loss: 0.1419 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - reg_loss | 0.142 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UEM | 0.563 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - LEM | 0.321 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EM | 0.847 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.005 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UAS | 0.936 | N/A\n", + "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:44:55,055 
- INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.915 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - loss | 0.811 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - LAS | 0.881 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:44:55,056 - INFO - combo.training.trainer - Epoch duration: 0:01:04.639291\n", + "2023-04-06 23:44:55,056 - INFO - combo.training.trainer - Estimated training time remaining: 6:36:13\n", + "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - Epoch 49/399\n", + "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:44:55,062 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9468, LAS: 0.8951, UEM: 0.5605, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8158, partial_loss/deprel_loss: 0.8483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9846, loss: 0.7297, batch_reg_loss: 0.1428, reg_loss: 0.1428 ||: 4%|4 | 4/95 [00:02<00:46, 1.94it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9492, LAS: 0.8979, UEM: 0.6192, LEM: 0.3542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2337, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.6914, batch_reg_loss: 0.1429, reg_loss: 0.1428 ||: 7%|7 | 7/95 [00:04<00:52, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9468, LAS: 0.8960, UEM: 0.6436, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1523, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.7006, batch_reg_loss: 0.1429, reg_loss: 0.1429 ||: 11%|# | 10/95 [00:06<00:56, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9431, LAS: 0.8893, UEM: 0.5835, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4091, partial_loss/deprel_loss: 0.6584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.7444, batch_reg_loss: 0.1430, reg_loss: 0.1429 ||: 15%|#4 | 14/95 [00:09<00:51, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9415, LAS: 0.8879, UEM: 0.5673, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6671, partial_loss/deprel_loss: 0.6714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8136, loss: 0.7581, batch_reg_loss: 0.1431, reg_loss: 0.1429 ||: 19%|#8 | 18/95 [00:11<00:47, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8277, UAS: 0.9393, LAS: 0.8853, UEM: 0.5465, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3672, 
partial_loss/deprel_loss: 1.0111, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2254, loss: 0.7825, batch_reg_loss: 0.1431, reg_loss: 0.1430 ||: 22%|##2 | 21/95 [00:13<00:47, 1.57it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9398, LAS: 0.8865, UEM: 0.5490, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2423, partial_loss/deprel_loss: 0.8838, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0987, loss: 0.7780, batch_reg_loss: 0.1432, reg_loss: 0.1430 ||: 26%|##6 | 25/95 [00:16<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9369, LAS: 0.8828, UEM: 0.5379, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.8710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9864, loss: 0.8033, batch_reg_loss: 0.1433, reg_loss: 0.1430 ||: 29%|##9 | 28/95 [00:18<00:44, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9374, LAS: 0.8834, UEM: 0.5485, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1769, partial_loss/deprel_loss: 0.9157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1113, loss: 0.7973, batch_reg_loss: 0.1433, reg_loss: 0.1430 ||: 33%|###2 | 31/95 [00:20<00:43, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9366, LAS: 0.8823, UEM: 0.5334, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7944, loss: 0.8072, batch_reg_loss: 0.1434, reg_loss: 0.1431 ||: 36%|###5 | 34/95 
[00:22<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9372, LAS: 0.8830, UEM: 0.5274, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4577, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.8014, batch_reg_loss: 0.1434, reg_loss: 0.1431 ||: 39%|###8 | 37/95 [00:24<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9367, LAS: 0.8823, UEM: 0.5204, LEM: 0.2730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6713, partial_loss/deprel_loss: 0.7439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8729, loss: 0.8124, batch_reg_loss: 0.1435, reg_loss: 0.1431 ||: 42%|####2 | 40/95 [00:26<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9368, LAS: 0.8824, UEM: 0.5301, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1867, partial_loss/deprel_loss: 0.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.8118, batch_reg_loss: 0.1436, reg_loss: 0.1432 ||: 46%|####6 | 44/95 [00:29<00:34, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9372, LAS: 0.8830, UEM: 0.5267, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3491, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6680, loss: 0.8096, batch_reg_loss: 0.1436, reg_loss: 0.1432 ||: 51%|##### | 48/95 [00:31<00:31, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9359, LAS: 0.8816, UEM: 0.5234, LEM: 0.2767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 1.6888, partial_loss/deprel_loss: 1.1994, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4410, loss: 0.8214, batch_reg_loss: 0.1437, reg_loss: 0.1432 ||: 54%|#####3 | 51/95 [00:33<00:29, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9366, LAS: 0.8824, UEM: 0.5644, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0663, partial_loss/deprel_loss: 0.1810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3018, loss: 0.8144, batch_reg_loss: 0.1437, reg_loss: 0.1433 ||: 57%|#####6 | 54/95 [00:36<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9368, LAS: 0.8822, UEM: 0.5618, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.5460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 0.8138, batch_reg_loss: 0.1438, reg_loss: 0.1433 ||: 60%|###### | 57/95 [00:38<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9355, LAS: 0.8809, UEM: 0.5548, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.4428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5435, loss: 0.8239, batch_reg_loss: 0.1439, reg_loss: 0.1433 ||: 64%|######4 | 61/95 [00:40<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9361, LAS: 0.8814, UEM: 0.5611, LEM: 0.3194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3078, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6117, loss: 0.8197, batch_reg_loss: 0.1439, reg_loss: 0.1433 ||: 67%|######7 | 64/95 [00:43<00:21, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9364, LAS: 0.8815, UEM: 0.5533, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7052, partial_loss/deprel_loss: 0.7890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9162, loss: 0.8203, batch_reg_loss: 0.1440, reg_loss: 0.1434 ||: 72%|#######1 | 68/95 [00:45<00:18, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9355, LAS: 0.8806, UEM: 0.5464, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3218, partial_loss/deprel_loss: 0.9959, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2051, loss: 0.8276, batch_reg_loss: 0.1441, reg_loss: 0.1434 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9365, LAS: 0.8817, UEM: 0.5571, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5070, partial_loss/deprel_loss: 0.6505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7659, loss: 0.8192, batch_reg_loss: 0.1441, reg_loss: 0.1434 ||: 79%|#######8 | 75/95 [00:50<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9368, LAS: 0.8820, UEM: 0.5578, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3250, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.8165, batch_reg_loss: 0.1442, reg_loss: 0.1435 ||: 82%|########2 | 78/95 [00:52<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9365, LAS: 0.8816, UEM: 0.5566, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2677, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5191, loss: 0.8171, batch_reg_loss: 0.1442, reg_loss: 0.1435 ||: 85%|########5 | 81/95 [00:55<00:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9363, LAS: 0.8815, UEM: 0.5511, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4442, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8182, batch_reg_loss: 0.1443, reg_loss: 0.1435 ||: 89%|########9 | 85/95 [00:57<00:07, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9373, LAS: 0.8828, UEM: 0.5726, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1108, partial_loss/deprel_loss: 0.2497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3663, loss: 0.8079, batch_reg_loss: 0.1444, reg_loss: 0.1436 ||: 93%|#########2| 88/95 [01:00<00:05, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9376, LAS: 0.8832, UEM: 0.5692, LEM: 0.3286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4735, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6930, loss: 0.8064, batch_reg_loss: 0.1444, reg_loss: 0.1436 ||: 97%|#########6| 92/95 [01:02<00:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9378, LAS: 0.8832, UEM: 0.5714, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5080, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7632, loss: 0.8066, 
batch_reg_loss: 0.1445, reg_loss: 0.1436 ||: 100%|##########| 95/95 [01:04<00:00, 1.46it/s]\n", + "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer - reg_loss | 0.144 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UEM | 0.571 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LEM | 0.330 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EM | 0.888 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.508 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.646 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - loss | 0.807 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LAS | 0.883 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 
N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:45:59,941 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:59,941 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:59,941 - INFO - combo.training.trainer - Epoch duration: 0:01:04.885191\n", + "2023-04-06 23:45:59,941 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:46\n", + "2023-04-06 23:45:59,941 - INFO - allennlp.training.trainer - Epoch 50/399\n", + "2023-04-06 23:45:59,941 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:45:59,942 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:45:59,947 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9078, LAS: 0.8507, UEM: 0.3908, LEM: 0.1523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5539, partial_loss/deprel_loss: 0.6880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8057, loss: 1.0078, batch_reg_loss: 0.1445, reg_loss: 0.1445 ||: 3%|3 | 3/95 [00:02<01:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9317, LAS: 0.8766, UEM: 0.5551, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4512, partial_loss/deprel_loss: 0.6208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7314, loss: 0.8406, batch_reg_loss: 0.1446, reg_loss: 0.1445 ||: 6%|6 | 6/95 [00:04<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9265, LAS: 0.8697, UEM: 
0.5033, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7658, partial_loss/deprel_loss: 1.1443, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4133, loss: 0.8956, batch_reg_loss: 0.1446, reg_loss: 0.1446 ||: 11%|# | 10/95 [00:06<00:56, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9341, LAS: 0.8794, UEM: 0.5481, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6209, loss: 0.8274, batch_reg_loss: 0.1447, reg_loss: 0.1446 ||: 14%|#3 | 13/95 [00:09<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9374, LAS: 0.8833, UEM: 0.5741, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.7962, batch_reg_loss: 0.1448, reg_loss: 0.1446 ||: 17%|#6 | 16/95 [00:11<01:00, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9353, LAS: 0.8816, UEM: 0.5744, LEM: 0.3010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7819, partial_loss/deprel_loss: 0.7879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9315, loss: 0.8111, batch_reg_loss: 0.1448, reg_loss: 0.1446 ||: 20%|## | 19/95 [00:14<00:58, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9337, LAS: 0.8794, UEM: 0.5620, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0534, partial_loss/deprel_loss: 0.9259, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0962, loss: 0.8336, batch_reg_loss: 0.1449, reg_loss: 
0.1447 ||: 23%|##3 | 22/95 [00:16<00:54, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9366, LAS: 0.8828, UEM: 0.5983, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4925, loss: 0.8100, batch_reg_loss: 0.1449, reg_loss: 0.1447 ||: 26%|##6 | 25/95 [00:18<00:53, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8514, UAS: 0.9354, LAS: 0.8810, UEM: 0.5727, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 0.8764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0185, loss: 0.8204, batch_reg_loss: 0.1450, reg_loss: 0.1447 ||: 31%|### | 29/95 [00:21<00:47, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9376, LAS: 0.8837, UEM: 0.5951, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1037, partial_loss/deprel_loss: 0.2590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3730, loss: 0.7973, batch_reg_loss: 0.1451, reg_loss: 0.1448 ||: 35%|###4 | 33/95 [00:23<00:44, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8823, UAS: 0.9367, LAS: 0.8824, UEM: 0.5756, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6670, partial_loss/deprel_loss: 0.6741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.8089, batch_reg_loss: 0.1451, reg_loss: 0.1448 ||: 38%|###7 | 36/95 [00:25<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 
0.9375, LAS: 0.8833, UEM: 0.5715, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.8022, batch_reg_loss: 0.1452, reg_loss: 0.1448 ||: 41%|####1 | 39/95 [00:27<00:39, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9368, LAS: 0.8828, UEM: 0.5804, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4304, loss: 0.8037, batch_reg_loss: 0.1452, reg_loss: 0.1449 ||: 44%|####4 | 42/95 [00:30<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9351, LAS: 0.8807, UEM: 0.5662, LEM: 0.3249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5921, partial_loss/deprel_loss: 0.7327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8499, loss: 0.8204, batch_reg_loss: 0.1453, reg_loss: 0.1449 ||: 47%|####7 | 45/95 [00:32<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9360, LAS: 0.8817, UEM: 0.5692, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4875, partial_loss/deprel_loss: 0.6497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7626, loss: 0.8124, batch_reg_loss: 0.1453, reg_loss: 0.1449 ||: 51%|##### | 48/95 [00:34<00:33, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9346, LAS: 0.8800, UEM: 0.5626, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2597, partial_loss/deprel_loss: 0.4557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.8267, 
batch_reg_loss: 0.1454, reg_loss: 0.1449 ||: 55%|#####4 | 52/95 [00:37<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9348, LAS: 0.8800, UEM: 0.5570, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8865, partial_loss/deprel_loss: 0.8319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9883, loss: 0.8266, batch_reg_loss: 0.1455, reg_loss: 0.1450 ||: 58%|#####7 | 55/95 [00:39<00:28, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9349, LAS: 0.8801, UEM: 0.5596, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3515, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6537, loss: 0.8267, batch_reg_loss: 0.1455, reg_loss: 0.1450 ||: 61%|######1 | 58/95 [00:41<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9346, LAS: 0.8797, UEM: 0.5508, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0865, partial_loss/deprel_loss: 0.9012, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.8320, batch_reg_loss: 0.1456, reg_loss: 0.1450 ||: 65%|######5 | 62/95 [00:43<00:22, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9355, LAS: 0.8809, UEM: 0.5603, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.8214, batch_reg_loss: 0.1457, reg_loss: 0.1451 ||: 69%|######9 | 66/95 [00:46<00:19, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9361, LAS: 0.8818, 
UEM: 0.5629, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7719, partial_loss/deprel_loss: 0.7586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9070, loss: 0.8146, batch_reg_loss: 0.1458, reg_loss: 0.1451 ||: 74%|#######3 | 70/95 [00:49<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9361, LAS: 0.8819, UEM: 0.5576, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4729, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7050, loss: 0.8139, batch_reg_loss: 0.1458, reg_loss: 0.1452 ||: 78%|#######7 | 74/95 [00:51<00:13, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8327, UAS: 0.9368, LAS: 0.8829, UEM: 0.5771, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1562, partial_loss/deprel_loss: 1.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1986, loss: 0.8075, batch_reg_loss: 0.1459, reg_loss: 0.1452 ||: 82%|########2 | 78/95 [00:54<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9364, LAS: 0.8823, UEM: 0.5720, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4516, partial_loss/deprel_loss: 1.0691, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2915, loss: 0.8112, batch_reg_loss: 0.1459, reg_loss: 0.1452 ||: 86%|########6 | 82/95 [00:57<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9366, LAS: 0.8825, UEM: 0.5678, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.6596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7750, loss: 0.8109, 
batch_reg_loss: 0.1460, reg_loss: 0.1452 ||: 89%|########9 | 85/95 [00:59<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9374, LAS: 0.8832, UEM: 0.5746, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1837, partial_loss/deprel_loss: 0.3435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4576, loss: 0.8052, batch_reg_loss: 0.1460, reg_loss: 0.1453 ||: 93%|#########2| 88/95 [01:01<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9378, LAS: 0.8836, UEM: 0.5769, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7352, partial_loss/deprel_loss: 0.9154, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0254, loss: 0.8025, batch_reg_loss: 0.1461, reg_loss: 0.1453 ||: 96%|#########5| 91/95 [01:03<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9377, LAS: 0.8833, UEM: 0.5734, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.7708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.8052, batch_reg_loss: 0.1462, reg_loss: 0.1453 ||: 100%|##########| 95/95 [01:06<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9377, LAS: 0.8833, UEM: 0.5734, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.7708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.8052, batch_reg_loss: 0.1462, reg_loss: 0.1453 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-06 23:47:06,372 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n" + ] + }, 
+ { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9566, LAS: 0.9018, UEM: 0.7797, LEM: 0.5207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4264, partial_loss/deprel_loss: 29.7159, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8580, loss: 25.5143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9567, LAS: 0.9029, UEM: 0.7585, LEM: 0.4904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8997, partial_loss/deprel_loss: 34.5766, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8412, loss: 24.5860, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9503, LAS: 0.8962, UEM: 0.6993, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9073, partial_loss/deprel_loss: 29.4189, partial_loss/cycle_loss: 0.0000, batch_loss: 23.7166, loss: 25.8269, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9473, LAS: 0.8931, UEM: 0.6718, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 28.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0143, loss: 27.0167, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9473, LAS: 0.8931, UEM: 0.6718, LEM: 
0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 28.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0143, loss: 27.0167, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.10it/s]\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - reg_loss | 0.145 | 0.000\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - UEM | 0.573 | 0.672\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - LEM | 0.327 | 0.394\n", + "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EM | 0.868 | 0.922\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.732 | 0.310\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | 0.947\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.771 | 28.690\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - loss | 0.805 | 27.017\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - 
combo.training.tensorboard_writer - LAS | 0.883 | 0.893\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:47:16,342 - INFO - combo.training.trainer - Epoch duration: 0:01:16.400613\n", + "2023-04-06 23:47:16,342 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:38\n", + "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - Epoch 51/399\n", + "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:47:16,348 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9418, LAS: 0.8849, UEM: 0.3598, LEM: 0.1190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6567, partial_loss/deprel_loss: 0.7006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8380, loss: 0.7955, batch_reg_loss: 0.1462, reg_loss: 0.1462 ||: 3%|3 | 3/95 [00:02<01:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9489, LAS: 0.8934, UEM: 0.5391, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.6343, loss: 0.7233, batch_reg_loss: 0.1463, reg_loss: 0.1462 ||: 6%|6 | 6/95 [00:04<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9484, LAS: 0.8927, UEM: 0.5886, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2742, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.7152, batch_reg_loss: 0.1463, reg_loss: 0.1462 ||: 9%|9 | 9/95 [00:06<01:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9482, LAS: 0.8929, UEM: 0.5899, LEM: 0.3152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5917, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8061, loss: 0.7116, batch_reg_loss: 0.1464, reg_loss: 0.1463 ||: 14%|#3 | 13/95 [00:09<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9425, LAS: 0.8861, UEM: 0.5435, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4471, partial_loss/deprel_loss: 0.5360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6646, loss: 0.7664, batch_reg_loss: 0.1464, reg_loss: 0.1463 ||: 18%|#7 | 17/95 [00:11<00:52, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9440, LAS: 0.8886, UEM: 0.5466, LEM: 0.2774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.4940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.7496, batch_reg_loss: 0.1465, reg_loss: 0.1463 ||: 22%|##2 | 21/95 [00:14<00:48, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9404, 
LAS: 0.8849, UEM: 0.5174, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0270, partial_loss/deprel_loss: 0.9598, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1198, loss: 0.7867, batch_reg_loss: 0.1465, reg_loss: 0.1464 ||: 25%|##5 | 24/95 [00:16<00:47, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9391, LAS: 0.8837, UEM: 0.5188, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2842, partial_loss/deprel_loss: 0.4099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5314, loss: 0.7961, batch_reg_loss: 0.1466, reg_loss: 0.1464 ||: 28%|##8 | 27/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9409, LAS: 0.8856, UEM: 0.5292, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5539, loss: 0.7793, batch_reg_loss: 0.1467, reg_loss: 0.1464 ||: 33%|###2 | 31/95 [00:20<00:42, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9418, LAS: 0.8865, UEM: 0.5381, LEM: 0.2730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2403, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.7741, batch_reg_loss: 0.1467, reg_loss: 0.1464 ||: 36%|###5 | 34/95 [00:23<00:41, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9413, LAS: 0.8859, UEM: 0.5288, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4709, partial_loss/deprel_loss: 0.5891, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.7800, batch_reg_loss: 0.1468, reg_loss: 0.1465 ||: 39%|###8 | 37/95 [00:25<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9425, LAS: 0.8874, UEM: 0.5445, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.7694, batch_reg_loss: 0.1469, reg_loss: 0.1465 ||: 43%|####3 | 41/95 [00:27<00:36, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9425, LAS: 0.8873, UEM: 0.5542, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7870, partial_loss/deprel_loss: 0.7960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9411, loss: 0.7686, batch_reg_loss: 0.1469, reg_loss: 0.1465 ||: 46%|####6 | 44/95 [00:30<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9432, LAS: 0.8885, UEM: 0.5694, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4448, loss: 0.7603, batch_reg_loss: 0.1470, reg_loss: 0.1466 ||: 49%|####9 | 47/95 [00:32<00:34, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9404, LAS: 0.8856, UEM: 0.5516, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1840, partial_loss/deprel_loss: 0.8997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1035, loss: 0.7850, batch_reg_loss: 0.1470, reg_loss: 0.1466 ||: 54%|#####3 | 51/95 [00:34<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9406, LAS: 0.8859, UEM: 0.5674, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9788, partial_loss/deprel_loss: 0.9509, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1035, loss: 0.7812, batch_reg_loss: 0.1471, reg_loss: 0.1466 ||: 57%|#####6 | 54/95 [00:36<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9391, LAS: 0.8844, UEM: 0.5723, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2408, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.7934, batch_reg_loss: 0.1471, reg_loss: 0.1467 ||: 61%|######1 | 58/95 [00:39<00:24, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9380, LAS: 0.8832, UEM: 0.5718, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1437, partial_loss/deprel_loss: 1.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5997, loss: 0.8041, batch_reg_loss: 0.1472, reg_loss: 0.1467 ||: 65%|######5 | 62/95 [00:42<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9389, LAS: 0.8846, UEM: 0.5914, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7249, partial_loss/deprel_loss: 0.7364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8814, loss: 0.7952, batch_reg_loss: 0.1473, reg_loss: 0.1467 ||: 68%|######8 | 65/95 [00:44<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9377, LAS: 0.8832, UEM: 0.5912, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.3402, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.8055, batch_reg_loss: 0.1473, reg_loss: 0.1467 ||: 73%|#######2 | 69/95 [00:47<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9380, LAS: 0.8834, UEM: 0.5869, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5853, partial_loss/deprel_loss: 0.6372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 0.8042, batch_reg_loss: 0.1474, reg_loss: 0.1468 ||: 76%|#######5 | 72/95 [00:49<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8181, UAS: 0.9366, LAS: 0.8817, UEM: 0.5751, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4094, partial_loss/deprel_loss: 0.9917, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2227, loss: 0.8158, batch_reg_loss: 0.1475, reg_loss: 0.1468 ||: 80%|######## | 76/95 [00:51<00:12, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9358, LAS: 0.8808, UEM: 0.5683, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1003, loss: 0.8236, batch_reg_loss: 0.1476, reg_loss: 0.1468 ||: 84%|########4 | 80/95 [00:53<00:09, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9358, LAS: 0.8808, UEM: 0.5622, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3467, partial_loss/deprel_loss: 0.5521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6587, loss: 0.8243, batch_reg_loss: 0.1476, reg_loss: 0.1469 ||: 88%|########8 | 84/95 [00:56<00:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9364, LAS: 0.8813, UEM: 0.5618, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5633, partial_loss/deprel_loss: 0.7083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8270, loss: 0.8204, batch_reg_loss: 0.1477, reg_loss: 0.1469 ||: 93%|#########2| 88/95 [00:59<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9373, LAS: 0.8825, UEM: 0.5713, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.5724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.8121, batch_reg_loss: 0.1478, reg_loss: 0.1469 ||: 96%|#########5| 91/95 [01:02<00:02, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9378, LAS: 0.8829, UEM: 0.5731, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.8094, batch_reg_loss: 0.1479, reg_loss: 0.1470 ||: 100%|##########| 95/95 [01:04<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9378, LAS: 0.8829, UEM: 0.5731, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.8094, batch_reg_loss: 0.1479, reg_loss: 0.1470 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + 
"2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - reg_loss | 0.147 | N/A\n", + "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UEM | 0.573 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LEM | 0.328 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - EM | 0.912 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.289 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.475 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - loss | 0.809 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LAS | 0.883 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:21,161 - INFO - combo.training.trainer - Epoch duration: 0:01:04.818947\n", + "2023-04-06 23:48:21,161 - INFO - combo.training.trainer - Estimated training time remaining: 6:33:10\n", + "2023-04-06 23:48:21,161 - INFO - allennlp.training.trainer - Epoch 52/399\n", + "2023-04-06 23:48:21,161 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:48:21,162 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:48:21,167 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9308, LAS: 0.8799, UEM: 0.6359, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1617, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4247, loss: 0.8042, batch_reg_loss: 0.1479, reg_loss: 0.1479 ||: 3%|3 | 3/95 [00:02<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9420, LAS: 0.8884, UEM: 0.6471, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1579, partial_loss/deprel_loss: 0.4190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.7566, batch_reg_loss: 0.1480, reg_loss: 0.1479 ||: 7%|7 | 7/95 [00:04<01:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9364, LAS: 0.8820, UEM: 0.5961, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1484, partial_loss/deprel_loss: 1.0143, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1891, loss: 0.8171, batch_reg_loss: 0.1480, reg_loss: 0.1480 ||: 11%|# | 10/95 [00:06<01:00, 
1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9336, LAS: 0.8782, UEM: 0.5276, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7180, partial_loss/deprel_loss: 0.7570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8447, batch_reg_loss: 0.1481, reg_loss: 0.1480 ||: 15%|#4 | 14/95 [00:09<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9357, LAS: 0.8806, UEM: 0.5214, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6777, partial_loss/deprel_loss: 0.8299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9476, loss: 0.8326, batch_reg_loss: 0.1481, reg_loss: 0.1480 ||: 18%|#7 | 17/95 [00:11<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9371, LAS: 0.8815, UEM: 0.5317, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3349, partial_loss/deprel_loss: 0.5308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6398, loss: 0.8226, batch_reg_loss: 0.1482, reg_loss: 0.1480 ||: 22%|##2 | 21/95 [00:13<00:49, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9336, LAS: 0.8785, UEM: 0.5080, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 0.9645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1249, loss: 0.8501, batch_reg_loss: 0.1483, reg_loss: 0.1481 ||: 26%|##6 | 25/95 [00:16<00:46, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9349, LAS: 0.8800, UEM: 0.5150, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.4210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.8417, batch_reg_loss: 0.1483, reg_loss: 0.1481 ||: 29%|##9 | 28/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9358, LAS: 0.8812, UEM: 0.5436, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5508, loss: 0.8294, batch_reg_loss: 0.1484, reg_loss: 0.1481 ||: 33%|###2 | 31/95 [00:21<00:47, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9358, LAS: 0.8813, UEM: 0.5378, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7045, loss: 0.8295, batch_reg_loss: 0.1485, reg_loss: 0.1482 ||: 37%|###6 | 35/95 [00:24<00:43, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9380, LAS: 0.8842, UEM: 0.5699, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1450, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.8068, batch_reg_loss: 0.1485, reg_loss: 0.1482 ||: 41%|####1 | 39/95 [00:26<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7942, UAS: 0.9366, LAS: 0.8825, UEM: 0.5679, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9756, partial_loss/deprel_loss: 1.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5398, loss: 0.8189, batch_reg_loss: 0.1486, reg_loss: 
0.1482 ||: 44%|####4 | 42/95 [00:29<00:38, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9361, LAS: 0.8820, UEM: 0.5585, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2940, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5767, loss: 0.8254, batch_reg_loss: 0.1487, reg_loss: 0.1483 ||: 48%|####8 | 46/95 [00:31<00:33, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9373, LAS: 0.8833, UEM: 0.5702, LEM: 0.3198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.6539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7603, loss: 0.8182, batch_reg_loss: 0.1487, reg_loss: 0.1483 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9373, LAS: 0.8831, UEM: 0.5623, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4181, partial_loss/deprel_loss: 0.6043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7158, loss: 0.8206, batch_reg_loss: 0.1488, reg_loss: 0.1483 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9375, LAS: 0.8832, UEM: 0.5650, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.8150, batch_reg_loss: 0.1488, reg_loss: 0.1483 ||: 59%|#####8 | 56/95 [00:38<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8324, UAS: 0.9381, LAS: 0.8839, UEM: 0.5715, LEM: 0.3173, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3018, partial_loss/deprel_loss: 1.0026, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2113, loss: 0.8112, batch_reg_loss: 0.1489, reg_loss: 0.1484 ||: 63%|######3 | 60/95 [00:40<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9374, LAS: 0.8830, UEM: 0.5618, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7262, partial_loss/deprel_loss: 0.7235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8730, loss: 0.8165, batch_reg_loss: 0.1489, reg_loss: 0.1484 ||: 66%|######6 | 63/95 [00:42<00:21, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9382, LAS: 0.8840, UEM: 0.5622, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4737, partial_loss/deprel_loss: 0.6175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7378, loss: 0.8098, batch_reg_loss: 0.1490, reg_loss: 0.1484 ||: 69%|######9 | 66/95 [00:44<00:19, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8108, UAS: 0.9377, LAS: 0.8833, UEM: 0.5594, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4983, partial_loss/deprel_loss: 1.1986, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4076, loss: 0.8166, batch_reg_loss: 0.1490, reg_loss: 0.1485 ||: 73%|#######2 | 69/95 [00:47<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9378, LAS: 0.8833, UEM: 0.5587, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3065, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.8146, batch_reg_loss: 0.1491, reg_loss: 0.1485 ||: 
76%|#######5 | 72/95 [00:49<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9391, LAS: 0.8849, UEM: 0.5869, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.8003, batch_reg_loss: 0.1491, reg_loss: 0.1485 ||: 79%|#######8 | 75/95 [00:52<00:15, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9391, LAS: 0.8849, UEM: 0.5810, LEM: 0.3327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.7175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8468, loss: 0.7992, batch_reg_loss: 0.1492, reg_loss: 0.1485 ||: 83%|########3 | 79/95 [00:54<00:11, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9390, LAS: 0.8849, UEM: 0.5754, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6301, partial_loss/deprel_loss: 0.7038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8383, loss: 0.7999, batch_reg_loss: 0.1492, reg_loss: 0.1486 ||: 86%|########6 | 82/95 [00:56<00:09, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9389, LAS: 0.8847, UEM: 0.5671, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.7119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8197, loss: 0.8009, batch_reg_loss: 0.1493, reg_loss: 0.1486 ||: 91%|######### | 86/95 [00:59<00:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9396, LAS: 0.8856, UEM: 0.5762, LEM: 0.3302, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1137, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4263, loss: 0.7948, batch_reg_loss: 0.1494, reg_loss: 0.1486 ||: 95%|#########4| 90/95 [01:02<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9392, LAS: 0.8851, UEM: 0.5773, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3726, partial_loss/deprel_loss: 0.5450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.7989, batch_reg_loss: 0.1494, reg_loss: 0.1487 ||: 98%|#########7| 93/95 [01:04<00:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8315, UAS: 0.9387, LAS: 0.8846, UEM: 0.5744, LEM: 0.3280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2811, partial_loss/deprel_loss: 0.9185, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1404, loss: 0.8018, batch_reg_loss: 0.1495, reg_loss: 0.1487 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - reg_loss | 0.149 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - UEM | 0.574 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - LEM | 0.328 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EM | 0.832 | N/A\n", + "2023-04-06 23:49:26,971 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 1.281 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.918 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - LAS | 0.885 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:49:26,973 - INFO - combo.training.trainer - Epoch duration: 0:01:05.811734\n", + "2023-04-06 23:49:26,973 - INFO - combo.training.trainer - Estimated training time remaining: 6:31:49\n", + "2023-04-06 23:49:26,973 - INFO - allennlp.training.trainer - Epoch 53/399\n", + "2023-04-06 23:49:26,973 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:49:26,974 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:49:26,980 
- INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9074, LAS: 0.8516, UEM: 0.2768, LEM: 0.1176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2356, partial_loss/deprel_loss: 0.9544, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1601, loss: 1.0297, batch_reg_loss: 0.1495, reg_loss: 0.1495 ||: 3%|3 | 3/95 [00:02<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9332, LAS: 0.8793, UEM: 0.6292, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3958, partial_loss/deprel_loss: 0.5297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6525, loss: 0.8124, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||: 6%|6 | 6/95 [00:04<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9334, LAS: 0.8799, UEM: 0.5389, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.8171, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||: 11%|# | 10/95 [00:06<00:56, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9385, LAS: 0.8856, UEM: 0.5737, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4720, loss: 0.7805, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||: 14%|#3 | 13/95 [00:08<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8637, UAS: 0.9397, LAS: 0.8870, UEM: 0.5782, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9353, partial_loss/deprel_loss: 0.8215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9940, loss: 0.7734, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||: 17%|#6 | 16/95 [00:10<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9376, LAS: 0.8846, UEM: 0.5705, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3460, partial_loss/deprel_loss: 1.0317, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2443, loss: 0.7951, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||: 21%|##1 | 20/95 [00:13<00:50, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9387, LAS: 0.8857, UEM: 0.5541, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5471, partial_loss/deprel_loss: 0.7203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8355, loss: 0.7887, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||: 24%|##4 | 23/95 [00:15<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9406, LAS: 0.8880, UEM: 0.5694, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6971, partial_loss/deprel_loss: 0.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.7714, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||: 27%|##7 | 26/95 [00:17<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9401, LAS: 0.8875, UEM: 0.5800, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8850, partial_loss/deprel_loss: 0.8165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9802, loss: 
0.7746, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||: 31%|### | 29/95 [00:19<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9407, LAS: 0.8880, UEM: 0.5727, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4124, partial_loss/deprel_loss: 0.5812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6975, loss: 0.7700, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||: 34%|###3 | 32/95 [00:21<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9424, LAS: 0.8896, UEM: 0.5849, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3894, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.7588, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||: 37%|###6 | 35/95 [00:24<00:45, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9401, LAS: 0.8871, UEM: 0.5659, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6715, partial_loss/deprel_loss: 0.7216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.7798, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||: 40%|#### | 38/95 [00:26<00:42, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9402, LAS: 0.8874, UEM: 0.5589, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2362, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.7810, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||: 44%|####4 | 42/95 [00:29<00:37, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9405, LAS: 0.8873, UEM: 
0.5617, LEM: 0.3126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9249, partial_loss/deprel_loss: 0.8992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0545, loss: 0.7805, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||: 47%|####7 | 45/95 [00:31<00:35, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9401, LAS: 0.8867, UEM: 0.5562, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.3797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5050, loss: 0.7841, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||: 52%|#####1 | 49/95 [00:34<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9389, LAS: 0.8857, UEM: 0.5537, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2715, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.7928, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9378, LAS: 0.8848, UEM: 0.5472, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7601, partial_loss/deprel_loss: 1.0152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3145, loss: 0.8008, batch_reg_loss: 0.1504, reg_loss: 0.1499 ||: 58%|#####7 | 55/95 [00:38<00:28, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9370, LAS: 0.8838, UEM: 0.5553, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2572, partial_loss/deprel_loss: 0.4285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5446, loss: 0.8078, batch_reg_loss: 
0.1504, reg_loss: 0.1500 ||: 61%|######1 | 58/95 [00:40<00:26, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9364, LAS: 0.8831, UEM: 0.5463, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4287, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.8138, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||: 65%|######5 | 62/95 [00:42<00:22, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9364, LAS: 0.8830, UEM: 0.5485, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2064, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.8177, batch_reg_loss: 0.1506, reg_loss: 0.1500 ||: 69%|######9 | 66/95 [00:45<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9381, LAS: 0.8851, UEM: 0.5775, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3076, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.8029, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||: 74%|#######3 | 70/95 [00:48<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9380, LAS: 0.8847, UEM: 0.5696, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5853, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8619, loss: 0.8040, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||: 78%|#######7 | 74/95 [00:50<00:13, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9385, LAS: 0.8852, UEM: 0.5755, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7588, partial_loss/deprel_loss: 0.7845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9302, loss: 0.7990, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||: 82%|########2 | 78/95 [00:53<00:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9397, LAS: 0.8864, UEM: 0.5853, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.7898, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||: 86%|########6 | 82/95 [00:55<00:08, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9392, LAS: 0.8857, UEM: 0.5788, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7710, partial_loss/deprel_loss: 0.8137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9561, loss: 0.7949, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||: 91%|######### | 86/95 [00:58<00:05, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9395, LAS: 0.8860, UEM: 0.5767, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3494, partial_loss/deprel_loss: 0.5346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6486, loss: 0.7926, batch_reg_loss: 0.1510, reg_loss: 0.1502 ||: 95%|#########4| 90/95 [01:00<00:03, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9386, LAS: 0.8847, UEM: 0.5728, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8984, partial_loss/deprel_loss: 0.8506, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0112, loss: 0.8005, batch_reg_loss: 0.1511, reg_loss: 0.1503 ||: 99%|#########8| 94/95 [01:03<00:00, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9382, LAS: 0.8843, UEM: 0.5700, LEM: 0.3266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0352, partial_loss/deprel_loss: 0.9346, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1058, loss: 0.8037, batch_reg_loss: 0.1511, reg_loss: 0.1503 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-06 23:50:30,698 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - reg_loss | 0.150 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UEM | 0.570 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - LEM | 0.327 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EM | 0.841 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.035 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - 
partial_loss/deprel_loss | 0.935 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - loss | 0.804 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - LAS | 0.884 | N/A\n", + "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:50:30,700 - INFO - combo.training.trainer - Epoch duration: 0:01:03.727272\n", + "2023-04-06 23:50:30,701 - INFO - combo.training.trainer - Estimated training time remaining: 6:30:15\n", + "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - Epoch 54/399\n", + "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:50:30,708 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9432, LAS: 0.8912, UEM: 0.4653, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3018, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6229, loss: 0.7230, batch_reg_loss: 0.1512, reg_loss: 0.1511 ||: 4%|4 | 4/95 [00:02<00:53, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9407, LAS: 0.8860, UEM: 0.4340, LEM: 0.1799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5516, partial_loss/deprel_loss: 0.6807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8061, loss: 0.7673, batch_reg_loss: 0.1512, reg_loss: 0.1512 ||: 7%|7 | 7/95 [00:04<00:55, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9446, LAS: 0.8911, UEM: 0.5261, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.7591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.7372, batch_reg_loss: 0.1513, reg_loss: 0.1512 ||: 11%|# | 10/95 [00:06<00:56, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8014, UAS: 0.9321, LAS: 0.8777, UEM: 0.4638, LEM: 0.2215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7332, partial_loss/deprel_loss: 1.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4221, loss: 0.8509, batch_reg_loss: 0.1513, reg_loss: 0.1512 ||: 15%|#4 | 14/95 [00:09<00:54, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9389, LAS: 0.8856, UEM: 0.5889, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1185, partial_loss/deprel_loss: 0.2801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3991, loss: 0.7908, batch_reg_loss: 0.1514, reg_loss: 0.1512 ||: 18%|#7 | 17/95 [00:11<00:54, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9422, LAS: 0.8906, UEM: 0.6494, LEM: 0.4311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8040, partial_loss/deprel_loss: 0.8287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9752, loss: 0.7633, batch_reg_loss: 0.1514, reg_loss: 0.1513 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9409, LAS: 0.8893, UEM: 0.6266, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0245, partial_loss/deprel_loss: 0.9164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0895, loss: 0.7669, batch_reg_loss: 0.1515, reg_loss: 0.1513 ||: 25%|##5 | 24/95 [00:16<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9400, LAS: 0.8877, UEM: 0.6214, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 0.4560, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5609, loss: 0.7795, batch_reg_loss: 0.1516, reg_loss: 0.1513 ||: 28%|##8 | 27/95 [00:18<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9423, LAS: 0.8900, UEM: 0.6320, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 0.7602, batch_reg_loss: 0.1516, reg_loss: 0.1514 ||: 32%|###1 | 30/95 [00:20<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9402, LAS: 0.8870, UEM: 0.6083, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5305, partial_loss/deprel_loss: 0.6831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8043, loss: 0.7803, batch_reg_loss: 0.1517, reg_loss: 0.1514 ||: 36%|###5 | 34/95 [00:23<00:40, 1.52it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9400, LAS: 0.8864, UEM: 0.5986, LEM: 0.3629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.5330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6429, loss: 0.7899, batch_reg_loss: 0.1517, reg_loss: 0.1514 ||: 40%|#### | 38/95 [00:25<00:36, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9409, LAS: 0.8871, UEM: 0.6169, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0997, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4227, loss: 0.7853, batch_reg_loss: 0.1518, reg_loss: 0.1515 ||: 44%|####4 | 42/95 [00:29<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9413, LAS: 0.8877, UEM: 0.6130, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9848, partial_loss/deprel_loss: 0.9332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0954, loss: 0.7816, batch_reg_loss: 0.1519, reg_loss: 0.1515 ||: 48%|####8 | 46/95 [00:31<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9406, LAS: 0.8871, UEM: 0.6170, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5783, loss: 0.7857, batch_reg_loss: 0.1520, reg_loss: 0.1515 ||: 53%|#####2 | 50/95 [00:34<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9409, LAS: 0.8871, UEM: 0.6076, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5270, 
partial_loss/deprel_loss: 0.6130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.7860, batch_reg_loss: 0.1520, reg_loss: 0.1516 ||: 56%|#####5 | 53/95 [00:36<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9395, LAS: 0.8854, UEM: 0.6006, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4682, partial_loss/deprel_loss: 0.6048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7295, loss: 0.7997, batch_reg_loss: 0.1521, reg_loss: 0.1516 ||: 60%|###### | 57/95 [00:38<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9390, LAS: 0.8849, UEM: 0.5891, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6837, partial_loss/deprel_loss: 0.6771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8306, loss: 0.8014, batch_reg_loss: 0.1521, reg_loss: 0.1516 ||: 64%|######4 | 61/95 [00:41<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9387, LAS: 0.8846, UEM: 0.5810, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0663, partial_loss/deprel_loss: 0.8890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0767, loss: 0.8040, batch_reg_loss: 0.1522, reg_loss: 0.1517 ||: 68%|######8 | 65/95 [00:43<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9382, LAS: 0.8842, UEM: 0.5700, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.7114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.8082, batch_reg_loss: 0.1523, reg_loss: 0.1517 ||: 73%|#######2 | 69/95 [00:46<00:16, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9388, LAS: 0.8849, UEM: 0.5726, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2094, partial_loss/deprel_loss: 0.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5182, loss: 0.8035, batch_reg_loss: 0.1523, reg_loss: 0.1517 ||: 77%|#######6 | 73/95 [00:48<00:13, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9375, LAS: 0.8835, UEM: 0.5630, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4102, partial_loss/deprel_loss: 0.9987, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2334, loss: 0.8147, batch_reg_loss: 0.1524, reg_loss: 0.1518 ||: 81%|########1 | 77/95 [00:50<00:10, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9382, LAS: 0.8841, UEM: 0.5651, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2742, partial_loss/deprel_loss: 0.4569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5728, loss: 0.8095, batch_reg_loss: 0.1525, reg_loss: 0.1518 ||: 85%|########5 | 81/95 [00:53<00:08, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9380, LAS: 0.8841, UEM: 0.5726, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6431, partial_loss/deprel_loss: 0.7291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8645, loss: 0.8083, batch_reg_loss: 0.1526, reg_loss: 0.1518 ||: 89%|########9 | 85/95 [00:56<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8391, UAS: 0.9384, LAS: 0.8845, UEM: 0.5755, LEM: 0.3316, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1240, partial_loss/deprel_loss: 0.8925, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0915, loss: 0.8048, batch_reg_loss: 0.1526, reg_loss: 0.1519 ||: 94%|#########3| 89/95 [00:59<00:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9386, LAS: 0.8847, UEM: 0.5751, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5276, partial_loss/deprel_loss: 0.6364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.8045, batch_reg_loss: 0.1527, reg_loss: 0.1519 ||: 98%|#########7| 93/95 [01:02<00:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9384, LAS: 0.8844, UEM: 0.5714, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5570, partial_loss/deprel_loss: 0.7028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8264, loss: 0.8055, batch_reg_loss: 0.1527, reg_loss: 0.1519 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - reg_loss | 0.152 | N/A\n", + "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UEM | 0.571 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LEM | 0.328 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - EM | 0.880 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - 
partial_loss/head_loss | 0.557 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.703 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - loss | 0.806 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LAS | 0.884 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,585 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,585 - INFO - combo.training.trainer - Epoch duration: 0:01:03.884523\n", + "2023-04-06 23:51:34,585 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:44\n", + "2023-04-06 23:51:34,585 - INFO - allennlp.training.trainer - Epoch 55/399\n", + "2023-04-06 23:51:34,586 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:51:34,586 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:51:34,592 - INFO - allennlp.training.trainer 
- Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9246, LAS: 0.8702, UEM: 0.4162, LEM: 0.1844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7076, partial_loss/deprel_loss: 0.7673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9081, loss: 0.9192, batch_reg_loss: 0.1528, reg_loss: 0.1528 ||: 3%|3 | 3/95 [00:02<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9409, LAS: 0.8876, UEM: 0.6300, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3062, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.7514, batch_reg_loss: 0.1528, reg_loss: 0.1528 ||: 6%|6 | 6/95 [00:04<01:11, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9288, LAS: 0.8742, UEM: 0.5475, LEM: 0.3031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2014, partial_loss/deprel_loss: 0.9325, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1391, loss: 0.8618, batch_reg_loss: 0.1529, reg_loss: 0.1528 ||: 9%|9 | 9/95 [00:07<01:06, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9283, LAS: 0.8745, UEM: 0.5024, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4370, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6525, loss: 0.8605, batch_reg_loss: 0.1530, reg_loss: 0.1529 ||: 14%|#3 | 13/95 [00:09<01:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9333, LAS: 0.8803, UEM: 0.5678, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.2531, partial_loss/deprel_loss: 0.4340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5508, loss: 0.8142, batch_reg_loss: 0.1530, reg_loss: 0.1529 ||: 17%|#6 | 16/95 [00:12<01:00, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9314, LAS: 0.8772, UEM: 0.5379, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5511, partial_loss/deprel_loss: 0.6187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7583, loss: 0.8362, batch_reg_loss: 0.1531, reg_loss: 0.1529 ||: 21%|##1 | 20/95 [00:14<00:54, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9366, LAS: 0.8835, UEM: 0.6102, LEM: 0.3794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0675, partial_loss/deprel_loss: 0.1877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3168, loss: 0.7936, batch_reg_loss: 0.1531, reg_loss: 0.1529 ||: 25%|##5 | 24/95 [00:17<00:52, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9365, LAS: 0.8834, UEM: 0.5995, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.4303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5477, loss: 0.8045, batch_reg_loss: 0.1532, reg_loss: 0.1530 ||: 29%|##9 | 28/95 [00:20<00:47, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9370, LAS: 0.8837, UEM: 0.5871, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6924, partial_loss/deprel_loss: 0.7964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9289, loss: 0.8024, batch_reg_loss: 0.1533, 
reg_loss: 0.1530 ||: 33%|###2 | 31/95 [00:22<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9347, LAS: 0.8810, UEM: 0.5645, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7922, loss: 0.8214, batch_reg_loss: 0.1533, reg_loss: 0.1530 ||: 37%|###6 | 35/95 [00:25<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9353, LAS: 0.8816, UEM: 0.5658, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.8181, batch_reg_loss: 0.1534, reg_loss: 0.1531 ||: 40%|#### | 38/95 [00:27<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9350, LAS: 0.8809, UEM: 0.5577, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9163, partial_loss/deprel_loss: 0.8228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9950, loss: 0.8232, batch_reg_loss: 0.1535, reg_loss: 0.1531 ||: 44%|####4 | 42/95 [00:29<00:35, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9343, LAS: 0.8800, UEM: 0.5480, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.5582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6766, loss: 0.8292, batch_reg_loss: 0.1535, reg_loss: 0.1531 ||: 47%|####7 | 45/95 [00:31<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9360, LAS: 0.8817, UEM: 0.5640, LEM: 0.3267, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4991, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7727, loss: 0.8155, batch_reg_loss: 0.1536, reg_loss: 0.1532 ||: 51%|##### | 48/95 [00:33<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9372, LAS: 0.8833, UEM: 0.5737, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2591, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.8033, batch_reg_loss: 0.1536, reg_loss: 0.1532 ||: 54%|#####3 | 51/95 [00:35<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9379, LAS: 0.8836, UEM: 0.5688, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6107, partial_loss/deprel_loss: 0.7630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8862, loss: 0.8026, batch_reg_loss: 0.1537, reg_loss: 0.1532 ||: 58%|#####7 | 55/95 [00:38<00:26, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9386, LAS: 0.8845, UEM: 0.5654, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3918, partial_loss/deprel_loss: 0.5176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.7971, batch_reg_loss: 0.1538, reg_loss: 0.1533 ||: 62%|######2 | 59/95 [00:40<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9392, LAS: 0.8850, UEM: 0.5727, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4212, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.7926, batch_reg_loss: 0.1538, reg_loss: 0.1533 ||: 
66%|######6 | 63/95 [00:43<00:20, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9371, LAS: 0.8827, UEM: 0.5671, LEM: 0.3200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8757, partial_loss/deprel_loss: 0.8471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0066, loss: 0.8118, batch_reg_loss: 0.1539, reg_loss: 0.1533 ||: 71%|####### | 67/95 [00:46<00:18, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9374, LAS: 0.8829, UEM: 0.5622, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.7673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8817, loss: 0.8103, batch_reg_loss: 0.1539, reg_loss: 0.1534 ||: 75%|#######4 | 71/95 [00:48<00:15, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8005, UAS: 0.9372, LAS: 0.8826, UEM: 0.5689, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8491, partial_loss/deprel_loss: 1.1676, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4579, loss: 0.8126, batch_reg_loss: 0.1540, reg_loss: 0.1534 ||: 79%|#######8 | 75/95 [00:51<00:13, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9367, LAS: 0.8821, UEM: 0.5602, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.8468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9780, loss: 0.8171, batch_reg_loss: 0.1541, reg_loss: 0.1534 ||: 83%|########3 | 79/95 [00:54<00:10, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9371, LAS: 0.8825, UEM: 0.5707, LEM: 0.3225, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1588, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4807, loss: 0.8144, batch_reg_loss: 0.1541, reg_loss: 0.1535 ||: 87%|########7 | 83/95 [00:57<00:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9373, LAS: 0.8828, UEM: 0.5761, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1189, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3788, loss: 0.8118, batch_reg_loss: 0.1542, reg_loss: 0.1535 ||: 92%|#########1| 87/95 [01:00<00:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9379, LAS: 0.8834, UEM: 0.5767, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2888, partial_loss/deprel_loss: 0.4539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5751, loss: 0.8068, batch_reg_loss: 0.1543, reg_loss: 0.1535 ||: 96%|#########5| 91/95 [01:02<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9380, LAS: 0.8835, UEM: 0.5754, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4507, partial_loss/deprel_loss: 0.6335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7513, loss: 0.8063, batch_reg_loss: 0.1543, reg_loss: 0.1535 ||: 99%|#########8| 94/95 [01:04<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9378, LAS: 0.8832, UEM: 0.5728, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0441, partial_loss/deprel_loss: 0.9468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1206, loss: 0.8096, batch_reg_loss: 0.1544, reg_loss: 0.1536 ||: 
100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:52:39,843 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9485, LAS: 0.8993, UEM: 0.6034, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 29.4420, partial_loss/cycle_loss: 0.0000, batch_loss: 23.7367, loss: 22.1813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9402, LAS: 0.8871, UEM: 0.5676, LEM: 0.2821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4387, partial_loss/deprel_loss: 59.0686, partial_loss/cycle_loss: 0.0000, batch_loss: 47.5426, loss: 28.3777, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9450, LAS: 0.8928, UEM: 0.6581, LEM: 0.4051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8604, partial_loss/deprel_loss: 34.5645, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8236, loss: 26.8009, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9466, LAS: 0.8934, UEM: 0.6662, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 29.6997, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8572, loss: 26.9928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 
[00:10<00:00, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9466, LAS: 0.8934, UEM: 0.6662, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 29.6997, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8572, loss: 26.9928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.06it/s]\n", + "2023-04-06 23:52:50,238 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - reg_loss | 0.154 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UEM | 0.573 | 0.666\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LEM | 0.326 | 0.397\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EM | 0.851 | 0.896\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.044 | 0.487\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | 0.947\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.947 | 29.700\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - loss | 0.810 
| 26.993\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LAS | 0.883 | 0.893\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:52:50,240 - INFO - combo.training.trainer - Epoch duration: 0:01:15.654778\n", + "2023-04-06 23:52:50,240 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:26\n", + "2023-04-06 23:52:50,240 - INFO - allennlp.training.trainer - Epoch 56/399\n", + "2023-04-06 23:52:50,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:52:50,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:52:50,246 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8305, UAS: 0.9262, LAS: 0.8712, UEM: 0.3168, LEM: 0.0991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3721, partial_loss/deprel_loss: 0.9398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1807, loss: 0.8943, batch_reg_loss: 0.1544, reg_loss: 0.1544 ||: 4%|4 | 4/95 [00:02<00:52, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9322, LAS: 0.8770, UEM: 0.4235, LEM: 
0.1870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 0.5488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6752, loss: 0.8571, batch_reg_loss: 0.1545, reg_loss: 0.1544 ||: 7%|7 | 7/95 [00:04<00:53, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9325, LAS: 0.8772, UEM: 0.4856, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6284, partial_loss/deprel_loss: 0.7571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8859, loss: 0.8623, batch_reg_loss: 0.1545, reg_loss: 0.1544 ||: 11%|# | 10/95 [00:06<00:55, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9383, LAS: 0.8840, UEM: 0.5598, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.4345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.8084, batch_reg_loss: 0.1546, reg_loss: 0.1545 ||: 14%|#3 | 13/95 [00:08<00:54, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9405, LAS: 0.8866, UEM: 0.5888, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7046, partial_loss/deprel_loss: 0.7288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8785, loss: 0.7837, batch_reg_loss: 0.1546, reg_loss: 0.1545 ||: 17%|#6 | 16/95 [00:10<00:52, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9426, LAS: 0.8891, UEM: 0.5805, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.5277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6480, loss: 0.7713, batch_reg_loss: 0.1547, reg_loss: 0.1545 ||: 21%|##1 | 
20/95 [00:13<00:49, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9432, LAS: 0.8909, UEM: 0.6266, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5408, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.7608, batch_reg_loss: 0.1547, reg_loss: 0.1546 ||: 24%|##4 | 23/95 [00:15<00:49, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9439, LAS: 0.8914, UEM: 0.6181, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8244, partial_loss/deprel_loss: 0.7752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9398, loss: 0.7575, batch_reg_loss: 0.1548, reg_loss: 0.1546 ||: 28%|##8 | 27/95 [00:18<00:45, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9449, LAS: 0.8917, UEM: 0.6201, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6989, partial_loss/deprel_loss: 0.8017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9360, loss: 0.7524, batch_reg_loss: 0.1548, reg_loss: 0.1546 ||: 32%|###1 | 30/95 [00:20<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9442, LAS: 0.8912, UEM: 0.6167, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5697, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7294, loss: 0.7548, batch_reg_loss: 0.1549, reg_loss: 0.1546 ||: 36%|###5 | 34/95 [00:22<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9415, LAS: 0.8884, 
UEM: 0.6010, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 0.6103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7250, loss: 0.7745, batch_reg_loss: 0.1550, reg_loss: 0.1547 ||: 39%|###8 | 37/95 [00:24<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9407, LAS: 0.8875, UEM: 0.5969, LEM: 0.3615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3139, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5483, loss: 0.7804, batch_reg_loss: 0.1550, reg_loss: 0.1547 ||: 42%|####2 | 40/95 [00:27<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9415, LAS: 0.8882, UEM: 0.6005, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3625, partial_loss/deprel_loss: 0.5394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.7746, batch_reg_loss: 0.1551, reg_loss: 0.1547 ||: 45%|####5 | 43/95 [00:29<00:39, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9415, LAS: 0.8882, UEM: 0.5928, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.5092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6367, loss: 0.7747, batch_reg_loss: 0.1551, reg_loss: 0.1547 ||: 48%|####8 | 46/95 [00:31<00:36, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9408, LAS: 0.8876, UEM: 0.5904, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.6605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 0.7798, batch_reg_loss: 
0.1552, reg_loss: 0.1548 ||: 52%|#####1 | 49/95 [00:34<00:33, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9415, LAS: 0.8884, UEM: 0.5918, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5655, loss: 0.7738, batch_reg_loss: 0.1552, reg_loss: 0.1548 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9396, LAS: 0.8862, UEM: 0.5763, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7964, partial_loss/deprel_loss: 0.7824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9405, loss: 0.7906, batch_reg_loss: 0.1553, reg_loss: 0.1548 ||: 59%|#####8 | 56/95 [00:38<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7874, UAS: 0.9390, LAS: 0.8856, UEM: 0.5793, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9541, partial_loss/deprel_loss: 1.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5254, loss: 0.7949, batch_reg_loss: 0.1553, reg_loss: 0.1549 ||: 63%|######3 | 60/95 [00:41<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7955, UAS: 0.9389, LAS: 0.8856, UEM: 0.5938, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5819, partial_loss/deprel_loss: 1.1667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4052, loss: 0.7929, batch_reg_loss: 0.1554, reg_loss: 0.1549 ||: 67%|######7 | 64/95 [00:43<00:20, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9391, LAS: 0.8859, UEM: 0.5976, LEM: 
0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1142, partial_loss/deprel_loss: 0.3327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4445, loss: 0.7904, batch_reg_loss: 0.1555, reg_loss: 0.1549 ||: 72%|#######1 | 68/95 [00:46<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9399, LAS: 0.8865, UEM: 0.5956, LEM: 0.3551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5234, partial_loss/deprel_loss: 0.7011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8211, loss: 0.7863, batch_reg_loss: 0.1555, reg_loss: 0.1550 ||: 76%|#######5 | 72/95 [00:49<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9390, LAS: 0.8855, UEM: 0.5850, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 0.6956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8331, loss: 0.7931, batch_reg_loss: 0.1556, reg_loss: 0.1550 ||: 80%|######## | 76/95 [00:52<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9392, LAS: 0.8854, UEM: 0.5840, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0770, partial_loss/deprel_loss: 0.9281, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1136, loss: 0.7925, batch_reg_loss: 0.1557, reg_loss: 0.1550 ||: 84%|########4 | 80/95 [00:54<00:10, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9398, LAS: 0.8862, UEM: 0.5856, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4596, partial_loss/deprel_loss: 0.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7314, loss: 0.7873, batch_reg_loss: 0.1557, 
reg_loss: 0.1550 ||: 87%|########7 | 83/95 [00:56<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9392, LAS: 0.8855, UEM: 0.5793, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3229, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6098, loss: 0.7921, batch_reg_loss: 0.1558, reg_loss: 0.1551 ||: 92%|#########1| 87/95 [00:59<00:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9390, LAS: 0.8853, UEM: 0.5784, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7266, partial_loss/deprel_loss: 0.7919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9347, loss: 0.7935, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||: 95%|#########4| 90/95 [01:01<00:03, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9386, LAS: 0.8848, UEM: 0.5719, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8613, partial_loss/deprel_loss: 0.8771, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0299, loss: 0.7983, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||: 99%|#########8| 94/95 [01:04<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9382, LAS: 0.8843, UEM: 0.5696, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1757, partial_loss/deprel_loss: 0.9447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1468, loss: 0.8020, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - 
Training | Validation\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - reg_loss | 0.155 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - UEM | 0.570 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - LEM | 0.329 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EM | 0.844 | N/A\n", + "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.176 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - UAS | 0.938 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.945 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - LAS | 0.884 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - 
combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:53:55,305 - INFO - combo.training.trainer - Epoch duration: 0:01:05.064412\n", + "2023-04-06 23:53:55,305 - INFO - combo.training.trainer - Estimated training time remaining: 6:27:02\n", + "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - Epoch 57/399\n", + "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:53:55,311 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9514, LAS: 0.8998, UEM: 0.5685, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.6701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8141, loss: 0.6940, batch_reg_loss: 0.1560, reg_loss: 0.1560 ||: 3%|3 | 3/95 [00:02<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9429, LAS: 0.8933, UEM: 0.6418, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8174, partial_loss/deprel_loss: 0.6788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8626, loss: 0.7285, batch_reg_loss: 0.1560, reg_loss: 0.1560 ||: 6%|6 | 6/95 [00:04<01:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9323, LAS: 0.8814, UEM: 0.5794, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4063, partial_loss/deprel_loss: 0.4939, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6324, loss: 0.8184, batch_reg_loss: 0.1561, reg_loss: 0.1560 ||: 9%|9 | 9/95 [00:06<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9295, LAS: 0.8768, UEM: 0.5295, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5860, partial_loss/deprel_loss: 0.6730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8118, loss: 0.8601, batch_reg_loss: 0.1562, reg_loss: 0.1561 ||: 14%|#3 | 13/95 [00:08<00:55, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9299, LAS: 0.8773, UEM: 0.5165, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2354, partial_loss/deprel_loss: 0.4117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5327, loss: 0.8636, batch_reg_loss: 0.1562, reg_loss: 0.1561 ||: 17%|#6 | 16/95 [00:10<00:53, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9312, LAS: 0.8786, UEM: 0.5149, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9326, partial_loss/deprel_loss: 0.7946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 0.8560, batch_reg_loss: 0.1563, reg_loss: 0.1561 ||: 21%|##1 | 20/95 [00:13<00:49, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9314, LAS: 0.8781, UEM: 0.4962, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9069, partial_loss/deprel_loss: 0.8206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9942, loss: 0.8563, batch_reg_loss: 0.1564, reg_loss: 0.1562 ||: 24%|##4 | 23/95 [00:15<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8687, UAS: 0.9310, LAS: 0.8775, UEM: 0.4864, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 0.7806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9451, loss: 0.8614, batch_reg_loss: 0.1564, reg_loss: 0.1562 ||: 27%|##7 | 26/95 [00:17<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9330, LAS: 0.8797, UEM: 0.4983, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3869, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.8448, batch_reg_loss: 0.1565, reg_loss: 0.1562 ||: 31%|### | 29/95 [00:19<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9360, LAS: 0.8833, UEM: 0.5451, LEM: 0.3109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5663, loss: 0.8185, batch_reg_loss: 0.1565, reg_loss: 0.1562 ||: 34%|###3 | 32/95 [00:21<00:44, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9353, LAS: 0.8824, UEM: 0.5308, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4447, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6102, loss: 0.8230, batch_reg_loss: 0.1566, reg_loss: 0.1563 ||: 38%|###7 | 36/95 [00:24<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9349, LAS: 0.8817, UEM: 0.5291, LEM: 0.2952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, 
partial_loss/deprel_loss: 0.7378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8886, loss: 0.8245, batch_reg_loss: 0.1566, reg_loss: 0.1563 ||: 41%|####1 | 39/95 [00:26<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9360, LAS: 0.8826, UEM: 0.5297, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.6143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7403, loss: 0.8194, batch_reg_loss: 0.1567, reg_loss: 0.1563 ||: 44%|####4 | 42/95 [00:28<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9374, LAS: 0.8840, UEM: 0.5491, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9230, partial_loss/deprel_loss: 0.8469, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0189, loss: 0.8084, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||: 48%|####8 | 46/95 [00:31<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9383, LAS: 0.8847, UEM: 0.5481, LEM: 0.2973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6985, loss: 0.8031, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||: 52%|#####1 | 49/95 [00:35<00:40, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9386, LAS: 0.8848, UEM: 0.5428, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.5208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.8013, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||: 55%|#####4 | 52/95 [00:37<00:35, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9132, UAS: 0.9388, LAS: 0.8851, UEM: 0.5479, LEM: 0.2955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2873, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.7988, batch_reg_loss: 0.1569, reg_loss: 0.1564 ||: 58%|#####7 | 55/95 [00:39<00:32, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9386, LAS: 0.8854, UEM: 0.5680, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0666, partial_loss/deprel_loss: 0.1669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3038, loss: 0.8006, batch_reg_loss: 0.1569, reg_loss: 0.1565 ||: 62%|######2 | 59/95 [00:42<00:28, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9386, LAS: 0.8854, UEM: 0.5663, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2632, partial_loss/deprel_loss: 0.4677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.7999, batch_reg_loss: 0.1570, reg_loss: 0.1565 ||: 65%|######5 | 62/95 [00:45<00:25, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9385, LAS: 0.8852, UEM: 0.5681, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.8015, batch_reg_loss: 0.1570, reg_loss: 0.1565 ||: 68%|######8 | 65/95 [00:47<00:23, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9393, LAS: 0.8861, UEM: 0.5810, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6600, 
partial_loss/deprel_loss: 0.7542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8925, loss: 0.7937, batch_reg_loss: 0.1571, reg_loss: 0.1565 ||: 72%|#######1 | 68/95 [00:49<00:20, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9401, LAS: 0.8870, UEM: 0.5895, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4321, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.7851, batch_reg_loss: 0.1571, reg_loss: 0.1566 ||: 75%|#######4 | 71/95 [00:51<00:18, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9406, LAS: 0.8876, UEM: 0.5927, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.7806, batch_reg_loss: 0.1572, reg_loss: 0.1566 ||: 78%|#######7 | 74/95 [00:53<00:15, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9402, LAS: 0.8869, UEM: 0.5958, LEM: 0.3471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.3719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4863, loss: 0.7857, batch_reg_loss: 0.1572, reg_loss: 0.1566 ||: 82%|########2 | 78/95 [00:56<00:12, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9400, LAS: 0.8867, UEM: 0.5954, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1439, partial_loss/deprel_loss: 0.3659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4787, loss: 0.7872, batch_reg_loss: 0.1573, reg_loss: 0.1566 ||: 85%|########5 | 81/95 [00:58<00:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9388, LAS: 0.8855, UEM: 0.5889, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7849, loss: 0.7964, batch_reg_loss: 0.1573, reg_loss: 0.1567 ||: 89%|########9 | 85/95 [01:01<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8431, UAS: 0.9382, LAS: 0.8849, UEM: 0.5850, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2189, partial_loss/deprel_loss: 0.9243, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1406, loss: 0.8010, batch_reg_loss: 0.1574, reg_loss: 0.1567 ||: 93%|#########2| 88/95 [01:03<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9382, LAS: 0.8847, UEM: 0.5793, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0566, partial_loss/deprel_loss: 0.9256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1092, loss: 0.8039, batch_reg_loss: 0.1574, reg_loss: 0.1567 ||: 97%|#########6| 92/95 [01:06<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9386, LAS: 0.8851, UEM: 0.5787, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9152, loss: 0.8015, batch_reg_loss: 0.1575, reg_loss: 0.1568 ||: 100%|##########| 95/95 [01:08<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9386, LAS: 0.8851, UEM: 0.5787, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9152, loss: 0.8015, batch_reg_loss: 0.1575, reg_loss: 0.1568 ||: 100%|##########| 95/95 [01:08<00:00, 1.39it/s]\n", + "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - reg_loss | 0.157 | N/A\n", + "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LEM | 0.331 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - EM | 0.872 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.797 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.748 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LAS | 0.885 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - 
combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:03,588 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:03,588 - INFO - combo.training.trainer - Epoch duration: 0:01:08.283101\n", + "2023-04-06 23:55:03,588 - INFO - combo.training.trainer - Estimated training time remaining: 6:25:58\n", + "2023-04-06 23:55:03,588 - INFO - allennlp.training.trainer - Epoch 58/399\n", + "2023-04-06 23:55:03,588 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:55:03,589 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:55:03,595 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9535, LAS: 0.9048, UEM: 0.6764, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2934, partial_loss/deprel_loss: 0.4203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.6294, batch_reg_loss: 0.1576, reg_loss: 0.1575 ||: 4%|4 | 4/95 [00:02<00:57, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9500, LAS: 0.8997, UEM: 0.6510, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7014, partial_loss/deprel_loss: 0.7054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 
0.6667, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||: 7%|7 | 7/95 [00:04<00:56, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9462, LAS: 0.8961, UEM: 0.7060, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0477, partial_loss/deprel_loss: 0.8501, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0473, loss: 0.7036, batch_reg_loss: 0.1577, reg_loss: 0.1576 ||: 11%|# | 10/95 [00:06<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9474, LAS: 0.8962, UEM: 0.6754, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6657, partial_loss/deprel_loss: 0.8229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9492, loss: 0.7093, batch_reg_loss: 0.1577, reg_loss: 0.1576 ||: 15%|#4 | 14/95 [00:09<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9421, LAS: 0.8899, UEM: 0.6545, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8990, partial_loss/deprel_loss: 0.8420, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0112, loss: 0.7615, batch_reg_loss: 0.1578, reg_loss: 0.1577 ||: 18%|#7 | 17/95 [00:11<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9386, LAS: 0.8864, UEM: 0.6129, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6553, partial_loss/deprel_loss: 0.6360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7977, loss: 0.7913, batch_reg_loss: 0.1579, reg_loss: 0.1577 ||: 22%|##2 | 21/95 [00:14<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9410, LAS: 0.8891, UEM: 0.6241, LEM: 
0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.4281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.7703, batch_reg_loss: 0.1579, reg_loss: 0.1577 ||: 25%|##5 | 24/95 [00:16<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9409, LAS: 0.8887, UEM: 0.6214, LEM: 0.3859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4183, partial_loss/deprel_loss: 0.5498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6815, loss: 0.7742, batch_reg_loss: 0.1580, reg_loss: 0.1577 ||: 28%|##8 | 27/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9412, LAS: 0.8893, UEM: 0.6210, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3110, partial_loss/deprel_loss: 0.3967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5376, loss: 0.7676, batch_reg_loss: 0.1580, reg_loss: 0.1578 ||: 32%|###1 | 30/95 [00:20<00:48, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9412, LAS: 0.8894, UEM: 0.6169, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9132, partial_loss/deprel_loss: 0.8714, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0378, loss: 0.7685, batch_reg_loss: 0.1581, reg_loss: 0.1578 ||: 35%|###4 | 33/95 [00:23<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9429, LAS: 0.8910, UEM: 0.6139, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.5630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6840, loss: 0.7588, batch_reg_loss: 0.1581, reg_loss: 0.1578 ||: 
39%|###8 | 37/95 [00:25<00:40, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9430, LAS: 0.8911, UEM: 0.6065, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2773, partial_loss/deprel_loss: 0.5158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6263, loss: 0.7592, batch_reg_loss: 0.1582, reg_loss: 0.1579 ||: 42%|####2 | 40/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9410, LAS: 0.8892, UEM: 0.6008, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4721, loss: 0.7747, batch_reg_loss: 0.1582, reg_loss: 0.1579 ||: 46%|####6 | 44/95 [00:30<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9413, LAS: 0.8894, UEM: 0.5904, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5840, partial_loss/deprel_loss: 0.6788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8182, loss: 0.7717, batch_reg_loss: 0.1583, reg_loss: 0.1579 ||: 51%|##### | 48/95 [00:32<00:31, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9409, LAS: 0.8889, UEM: 0.5887, LEM: 0.3417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.6978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8215, loss: 0.7760, batch_reg_loss: 0.1584, reg_loss: 0.1580 ||: 55%|#####4 | 52/95 [00:35<00:28, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9389, LAS: 0.8867, UEM: 0.5847, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2997, partial_loss/deprel_loss: 0.9815, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2036, loss: 0.7913, batch_reg_loss: 0.1584, reg_loss: 0.1580 ||: 59%|#####8 | 56/95 [00:38<00:26, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9382, LAS: 0.8857, UEM: 0.5789, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5541, loss: 0.8001, batch_reg_loss: 0.1585, reg_loss: 0.1580 ||: 63%|######3 | 60/95 [00:40<00:23, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9382, LAS: 0.8857, UEM: 0.5745, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7031, partial_loss/deprel_loss: 0.7636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9101, loss: 0.8013, batch_reg_loss: 0.1586, reg_loss: 0.1581 ||: 67%|######7 | 64/95 [00:43<00:21, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9375, LAS: 0.8849, UEM: 0.5662, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4286, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7073, loss: 0.8071, batch_reg_loss: 0.1587, reg_loss: 0.1581 ||: 72%|#######1 | 68/95 [00:46<00:17, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9377, LAS: 0.8849, UEM: 0.5654, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 
0.8082, batch_reg_loss: 0.1587, reg_loss: 0.1581 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9376, LAS: 0.8847, UEM: 0.5615, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4792, partial_loss/deprel_loss: 0.6233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.8099, batch_reg_loss: 0.1588, reg_loss: 0.1582 ||: 80%|######## | 76/95 [00:52<00:13, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9378, LAS: 0.8848, UEM: 0.5582, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4244, partial_loss/deprel_loss: 0.5378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6739, loss: 0.8090, batch_reg_loss: 0.1589, reg_loss: 0.1582 ||: 83%|########3 | 79/95 [00:54<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9391, LAS: 0.8863, UEM: 0.5690, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2843, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6026, loss: 0.7994, batch_reg_loss: 0.1589, reg_loss: 0.1582 ||: 87%|########7 | 83/95 [00:56<00:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9388, LAS: 0.8860, UEM: 0.5645, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.5243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6545, loss: 0.8033, batch_reg_loss: 0.1590, reg_loss: 0.1583 ||: 92%|#########1| 87/95 [00:59<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 
0.9383, LAS: 0.8854, UEM: 0.5636, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3970, partial_loss/deprel_loss: 0.5750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.8081, batch_reg_loss: 0.1590, reg_loss: 0.1583 ||: 95%|#########4| 90/95 [01:01<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9389, LAS: 0.8861, UEM: 0.5803, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1318, partial_loss/deprel_loss: 0.2567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3908, loss: 0.8016, batch_reg_loss: 0.1591, reg_loss: 0.1583 ||: 98%|#########7| 93/95 [01:04<00:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9389, LAS: 0.8862, UEM: 0.5780, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3488, partial_loss/deprel_loss: 0.5293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6523, loss: 0.8017, batch_reg_loss: 0.1591, reg_loss: 0.1583 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - reg_loss | 0.158 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UEM | 0.578 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - LEM | 0.329 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EM | 0.904 | N/A\n", + 
"2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.349 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.529 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - LAS | 0.886 | N/A\n", + "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.trainer - Epoch duration: 0:01:05.378838\n", + "2023-04-06 23:56:08,967 - INFO - combo.training.trainer - Estimated training time remaining: 6:24:36\n", + "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - Epoch 59/399\n", + "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - GPU 0 memory usage: 
2.4G\n", + "2023-04-06 23:56:08,972 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9668, LAS: 0.9214, UEM: 0.8388, LEM: 0.6739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 0.4612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5710, loss: 0.5334, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 3%|3 | 3/95 [00:02<01:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9447, LAS: 0.8962, UEM: 0.7278, LEM: 0.5356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4894, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.7324, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||: 7%|7 | 7/95 [00:04<01:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9368, LAS: 0.8860, UEM: 0.6479, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.4918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6231, loss: 0.7971, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||: 12%|#1 | 11/95 [00:07<00:59, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9405, LAS: 0.8894, UEM: 0.6198, LEM: 0.4015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4050, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6315, loss: 0.7755, batch_reg_loss: 0.1593, reg_loss: 0.1592 ||: 16%|#5 | 15/95 [00:09<00:54, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9432, LAS: 0.8910, UEM: 0.6084, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4418, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 0.7605, batch_reg_loss: 0.1594, reg_loss: 0.1592 ||: 20%|## | 19/95 [00:12<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9429, LAS: 0.8900, UEM: 0.5828, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.7659, batch_reg_loss: 0.1594, reg_loss: 0.1593 ||: 24%|##4 | 23/95 [00:15<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9435, LAS: 0.8912, UEM: 0.6006, LEM: 0.3587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2167, partial_loss/deprel_loss: 0.3695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.7566, batch_reg_loss: 0.1595, reg_loss: 0.1593 ||: 27%|##7 | 26/95 [00:17<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9447, LAS: 0.8927, UEM: 0.6153, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.5664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6906, loss: 0.7423, batch_reg_loss: 0.1595, reg_loss: 0.1593 ||: 31%|### | 29/95 [00:19<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9444, LAS: 0.8926, UEM: 0.6101, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9486, partial_loss/deprel_loss: 0.8810, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0541, loss: 0.7445, batch_reg_loss: 0.1596, reg_loss: 0.1593 ||: 35%|###4 | 33/95 [00:22<00:42, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9452, LAS: 0.8934, UEM: 0.6117, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.7371, batch_reg_loss: 0.1596, reg_loss: 0.1594 ||: 38%|###7 | 36/95 [00:24<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9432, LAS: 0.8910, UEM: 0.5908, LEM: 0.3416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6523, partial_loss/deprel_loss: 0.6621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8198, loss: 0.7559, batch_reg_loss: 0.1597, reg_loss: 0.1594 ||: 42%|####2 | 40/95 [00:26<00:35, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9442, LAS: 0.8916, UEM: 0.5983, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6514, partial_loss/deprel_loss: 0.7769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9115, loss: 0.7486, batch_reg_loss: 0.1597, reg_loss: 0.1594 ||: 47%|####7 | 45/95 [00:29<00:30, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9431, LAS: 0.8904, UEM: 0.5858, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4181, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7236, loss: 0.7604, batch_reg_loss: 0.1598, reg_loss: 0.1595 ||: 52%|#####1 | 49/95 [00:31<00:27, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9424, LAS: 0.8899, UEM: 0.5948, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6893, partial_loss/deprel_loss: 0.6942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8530, loss: 0.7647, batch_reg_loss: 0.1598, reg_loss: 0.1595 ||: 56%|#####5 | 53/95 [00:33<00:25, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9434, LAS: 0.8910, UEM: 0.6033, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5567, loss: 0.7560, batch_reg_loss: 0.1599, reg_loss: 0.1595 ||: 60%|###### | 57/95 [00:36<00:24, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9424, LAS: 0.8897, UEM: 0.5927, LEM: 0.3424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9398, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0086, loss: 0.7681, batch_reg_loss: 0.1600, reg_loss: 0.1595 ||: 64%|######4 | 61/95 [00:39<00:21, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9415, LAS: 0.8887, UEM: 0.5846, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1753, partial_loss/deprel_loss: 0.8177, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0493, loss: 0.7768, batch_reg_loss: 0.1600, reg_loss: 0.1596 ||: 68%|######8 | 65/95 [00:41<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.9403, LAS: 0.8875, UEM: 0.5899, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4067, partial_loss/deprel_loss: 0.9934, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.2361, loss: 0.7864, batch_reg_loss: 0.1601, reg_loss: 0.1596 ||: 73%|#######2 | 69/95 [00:44<00:16, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9406, LAS: 0.8879, UEM: 0.5918, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.5143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.7834, batch_reg_loss: 0.1602, reg_loss: 0.1596 ||: 77%|#######6 | 73/95 [00:47<00:14, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9404, LAS: 0.8874, UEM: 0.5856, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6402, partial_loss/deprel_loss: 0.7421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8819, loss: 0.7881, batch_reg_loss: 0.1602, reg_loss: 0.1597 ||: 81%|########1 | 77/95 [00:49<00:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9396, LAS: 0.8863, UEM: 0.5803, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0770, partial_loss/deprel_loss: 0.9965, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1729, loss: 0.7966, batch_reg_loss: 0.1603, reg_loss: 0.1597 ||: 85%|########5 | 81/95 [00:52<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9397, LAS: 0.8863, UEM: 0.5751, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4392, partial_loss/deprel_loss: 0.6400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.7989, batch_reg_loss: 0.1604, reg_loss: 0.1597 ||: 89%|########9 | 85/95 [00:55<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9386, LAS: 0.8850, UEM: 0.5739, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3208, partial_loss/deprel_loss: 0.4776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6067, loss: 0.8075, batch_reg_loss: 0.1604, reg_loss: 0.1597 ||: 93%|#########2| 88/95 [00:57<00:04, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9392, LAS: 0.8857, UEM: 0.5768, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1678, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.8025, batch_reg_loss: 0.1605, reg_loss: 0.1598 ||: 96%|#########5| 91/95 [00:59<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9391, LAS: 0.8854, UEM: 0.5732, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6358, loss: 0.8066, batch_reg_loss: 0.1606, reg_loss: 0.1598 ||: 100%|##########| 95/95 [01:02<00:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9391, LAS: 0.8854, UEM: 0.5732, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6358, loss: 0.8066, batch_reg_loss: 0.1606, reg_loss: 0.1598 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:57:11,130 
- INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UEM | 0.573 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - LEM | 0.328 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EM | 0.911 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.324 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.513 | N/A\n", + "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - loss | 0.807 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - LAS | 0.885 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 
23:57:11,131 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.trainer - Epoch duration: 0:01:02.164157\n", + "2023-04-06 23:57:11,131 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:57\n", + "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - Epoch 60/399\n", + "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:57:11,137 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9245, LAS: 0.8735, UEM: 0.5809, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2835, partial_loss/deprel_loss: 0.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 0.8867, batch_reg_loss: 0.1606, reg_loss: 0.1606 ||: 4%|4 | 4/95 [00:02<00:52, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9349, LAS: 0.8832, UEM: 0.5488, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6060, partial_loss/deprel_loss: 0.6525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8039, loss: 0.8042, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||: 8%|8 | 8/95 [00:04<00:51, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9444, LAS: 0.8942, UEM: 0.6930, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0510, partial_loss/deprel_loss: 0.1657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3035, loss: 0.7286, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||: 12%|#1 | 11/95 [00:07<00:55, 1.52it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9423, LAS: 0.8906, UEM: 0.6329, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4824, partial_loss/deprel_loss: 0.5800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.7588, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||: 16%|#5 | 15/95 [00:09<00:52, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9417, LAS: 0.8896, UEM: 0.5919, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5967, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7751, loss: 0.7680, batch_reg_loss: 0.1609, reg_loss: 0.1607 ||: 20%|## | 19/95 [00:12<00:48, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9428, LAS: 0.8911, UEM: 0.5764, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6191, partial_loss/deprel_loss: 0.6637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.7589, batch_reg_loss: 0.1609, reg_loss: 0.1608 ||: 24%|##4 | 23/95 [00:14<00:46, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9457, LAS: 0.8947, UEM: 0.6226, LEM: 0.3809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3466, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6113, loss: 0.7316, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||: 27%|##7 | 26/95 [00:17<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8313, UAS: 0.9451, LAS: 0.8939, UEM: 0.6225, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4179, 
partial_loss/deprel_loss: 0.9926, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2387, loss: 0.7391, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||: 32%|###1 | 30/95 [00:19<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9444, LAS: 0.8931, UEM: 0.6279, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1271, partial_loss/deprel_loss: 0.3208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.7458, batch_reg_loss: 0.1611, reg_loss: 0.1609 ||: 36%|###5 | 34/95 [00:22<00:40, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8490, UAS: 0.9430, LAS: 0.8910, UEM: 0.6072, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0711, partial_loss/deprel_loss: 0.9718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1528, loss: 0.7647, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||: 40%|#### | 38/95 [00:24<00:36, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9420, LAS: 0.8900, UEM: 0.6056, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8198, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9473, loss: 0.7771, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||: 44%|####4 | 42/95 [00:27<00:34, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9430, LAS: 0.8911, UEM: 0.6079, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3948, partial_loss/deprel_loss: 0.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.7663, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||: 48%|####8 | 46/95 
[00:30<00:32, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8200, UAS: 0.9429, LAS: 0.8905, UEM: 0.6061, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4237, partial_loss/deprel_loss: 1.1122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3359, loss: 0.7717, batch_reg_loss: 0.1613, reg_loss: 0.1610 ||: 53%|#####2 | 50/95 [00:32<00:29, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9439, LAS: 0.8916, UEM: 0.6126, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2412, partial_loss/deprel_loss: 0.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.7624, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||: 57%|#####6 | 54/95 [00:35<00:26, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9429, LAS: 0.8902, UEM: 0.6016, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.4670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5842, loss: 0.7729, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||: 61%|######1 | 58/95 [00:37<00:24, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9441, LAS: 0.8919, UEM: 0.6137, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4000, partial_loss/deprel_loss: 0.6110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7303, loss: 0.7600, batch_reg_loss: 0.1615, reg_loss: 0.1611 ||: 65%|######5 | 62/95 [00:40<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9432, LAS: 0.8905, UEM: 0.6067, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3855, partial_loss/deprel_loss: 0.5793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7021, loss: 0.7705, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||: 69%|######9 | 66/95 [00:43<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9421, LAS: 0.8893, UEM: 0.5971, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6925, partial_loss/deprel_loss: 0.7960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9369, loss: 0.7804, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||: 74%|#######3 | 70/95 [00:46<00:16, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9419, LAS: 0.8890, UEM: 0.5929, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6348, loss: 0.7832, batch_reg_loss: 0.1617, reg_loss: 0.1612 ||: 78%|#######7 | 74/95 [00:48<00:13, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9421, LAS: 0.8892, UEM: 0.5903, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5034, partial_loss/deprel_loss: 0.6401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7745, loss: 0.7812, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||: 82%|########2 | 78/95 [00:51<00:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9411, LAS: 0.8881, UEM: 0.5903, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4647, partial_loss/deprel_loss: 0.5666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7081, loss: 0.7896, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||: 86%|########6 | 82/95 
[00:54<00:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9410, LAS: 0.8880, UEM: 0.5907, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8185, partial_loss/deprel_loss: 0.7277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9077, loss: 0.7905, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||: 89%|########9 | 85/95 [00:56<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9406, LAS: 0.8877, UEM: 0.5881, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8441, partial_loss/deprel_loss: 0.7880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9612, loss: 0.7938, batch_reg_loss: 0.1619, reg_loss: 0.1613 ||: 93%|#########2| 88/95 [00:58<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9403, LAS: 0.8873, UEM: 0.5851, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.4747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.7959, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||: 97%|#########6| 92/95 [01:00<00:01, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9398, LAS: 0.8866, UEM: 0.5784, LEM: 0.3320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 0.7983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.8016, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-06 23:58:13,320 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9560, LAS: 0.9073, UEM: 0.8034, LEM: 0.6181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 19.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9847, loss: 26.0149, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9476, LAS: 0.8960, UEM: 0.7225, LEM: 0.5025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1885, partial_loss/deprel_loss: 22.8232, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2962, loss: 29.0160, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9471, LAS: 0.8934, UEM: 0.6713, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5159, partial_loss/deprel_loss: 24.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6260, loss: 26.5097, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.10it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9489, LAS: 0.8961, UEM: 0.6698, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 28.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7947, loss: 26.7813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9489, LAS: 0.8961, UEM: 0.6698, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 28.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7947, loss: 26.7813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.16it/s]\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - reg_loss | 0.161 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UEM | 0.578 | 0.670\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - LEM | 0.332 | 0.399\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EM | 0.870 | 0.928\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.862 | 0.300\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | 0.949\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.798 | 28.418\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - loss | 0.802 | 26.781\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - LAS | 0.887 | 0.896\n", + "2023-04-06 23:58:22,806 - INFO 
- combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.trainer - Epoch duration: 0:01:11.674813\n", + "2023-04-06 23:58:22,806 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:13\n", + "2023-04-06 23:58:22,806 - INFO - allennlp.training.trainer - Epoch 61/399\n", + "2023-04-06 23:58:22,807 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:58:22,807 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:58:22,813 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9493, LAS: 0.9001, UEM: 0.5113, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.4222, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5657, loss: 0.6838, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9380, LAS: 0.8878, UEM: 0.4589, LEM: 0.2282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9957, partial_loss/deprel_loss: 0.8262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0223, loss: 0.7848, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||: 6%|6 | 
6/95 [00:04<01:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9442, LAS: 0.8942, UEM: 0.5610, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2538, partial_loss/deprel_loss: 0.4180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.7266, batch_reg_loss: 0.1622, reg_loss: 0.1621 ||: 9%|9 | 9/95 [00:06<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9430, LAS: 0.8916, UEM: 0.5512, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1657, partial_loss/deprel_loss: 0.3888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.7471, batch_reg_loss: 0.1623, reg_loss: 0.1622 ||: 14%|#3 | 13/95 [00:09<00:58, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9446, LAS: 0.8934, UEM: 0.5710, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7792, partial_loss/deprel_loss: 0.8112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9671, loss: 0.7342, batch_reg_loss: 0.1623, reg_loss: 0.1622 ||: 17%|#6 | 16/95 [00:11<00:58, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9461, LAS: 0.8949, UEM: 0.5937, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1852, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4918, loss: 0.7225, batch_reg_loss: 0.1624, reg_loss: 0.1622 ||: 20%|## | 19/95 [00:13<00:55, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9465, LAS: 0.8951, UEM: 0.6055, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2041, partial_loss/deprel_loss: 0.4017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.7280, batch_reg_loss: 0.1624, reg_loss: 0.1622 ||: 24%|##4 | 23/95 [00:16<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9466, LAS: 0.8947, UEM: 0.6008, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1822, partial_loss/deprel_loss: 0.4087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5258, loss: 0.7323, batch_reg_loss: 0.1625, reg_loss: 0.1623 ||: 28%|##8 | 27/95 [00:18<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9436, LAS: 0.8907, UEM: 0.5673, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9718, partial_loss/deprel_loss: 0.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0251, loss: 0.7632, batch_reg_loss: 0.1625, reg_loss: 0.1623 ||: 33%|###2 | 31/95 [00:21<00:41, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9424, LAS: 0.8898, UEM: 0.5869, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0540, partial_loss/deprel_loss: 0.8374, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0433, loss: 0.7694, batch_reg_loss: 0.1626, reg_loss: 0.1623 ||: 37%|###6 | 35/95 [00:23<00:39, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9438, LAS: 0.8912, UEM: 0.6027, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1477, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4227, loss: 0.7581, batch_reg_loss: 0.1626, reg_loss: 
0.1624 ||: 40%|#### | 38/95 [00:26<00:38, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9432, LAS: 0.8908, UEM: 0.5884, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4037, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6594, loss: 0.7604, batch_reg_loss: 0.1627, reg_loss: 0.1624 ||: 44%|####4 | 42/95 [00:28<00:35, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9408, LAS: 0.8881, UEM: 0.5801, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0877, partial_loss/deprel_loss: 0.9107, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1088, loss: 0.7804, batch_reg_loss: 0.1627, reg_loss: 0.1624 ||: 47%|####7 | 45/95 [00:30<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7994, UAS: 0.9375, LAS: 0.8846, UEM: 0.5655, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7998, partial_loss/deprel_loss: 1.0932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3973, loss: 0.8055, batch_reg_loss: 0.1628, reg_loss: 0.1624 ||: 52%|#####1 | 49/95 [00:33<00:29, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9374, LAS: 0.8844, UEM: 0.5565, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4351, partial_loss/deprel_loss: 0.5761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7108, loss: 0.8063, batch_reg_loss: 0.1629, reg_loss: 0.1625 ||: 56%|#####5 | 53/95 [00:35<00:26, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9384, LAS: 0.8854, UEM: 0.5557, LEM: 0.3157, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3168, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.7999, batch_reg_loss: 0.1630, reg_loss: 0.1625 ||: 60%|###### | 57/95 [00:37<00:23, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9392, LAS: 0.8863, UEM: 0.5548, LEM: 0.3101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6487, loss: 0.7932, batch_reg_loss: 0.1630, reg_loss: 0.1625 ||: 64%|######4 | 61/95 [00:40<00:21, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9395, LAS: 0.8864, UEM: 0.5497, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6822, partial_loss/deprel_loss: 0.7306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8841, loss: 0.7922, batch_reg_loss: 0.1631, reg_loss: 0.1626 ||: 68%|######8 | 65/95 [00:43<00:20, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8188, UAS: 0.9390, LAS: 0.8860, UEM: 0.5673, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5033, partial_loss/deprel_loss: 1.0465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3010, loss: 0.7974, batch_reg_loss: 0.1632, reg_loss: 0.1626 ||: 73%|#######2 | 69/95 [00:46<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9401, LAS: 0.8873, UEM: 0.5793, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2484, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5615, loss: 0.7877, batch_reg_loss: 0.1632, reg_loss: 0.1626 ||: 
76%|#######5 | 72/95 [00:48<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9407, LAS: 0.8878, UEM: 0.5868, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7300, partial_loss/deprel_loss: 0.7953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9455, loss: 0.7839, batch_reg_loss: 0.1633, reg_loss: 0.1627 ||: 79%|#######8 | 75/95 [00:50<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9402, LAS: 0.8873, UEM: 0.5855, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2602, partial_loss/deprel_loss: 0.4101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7891, batch_reg_loss: 0.1633, reg_loss: 0.1627 ||: 83%|########3 | 79/95 [00:53<00:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9404, LAS: 0.8876, UEM: 0.5859, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2909, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5461, loss: 0.7864, batch_reg_loss: 0.1634, reg_loss: 0.1627 ||: 86%|########6 | 82/95 [00:55<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9407, LAS: 0.8877, UEM: 0.5833, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6463, partial_loss/deprel_loss: 0.7100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8607, loss: 0.7867, batch_reg_loss: 0.1634, reg_loss: 0.1627 ||: 91%|######### | 86/95 [00:57<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9406, LAS: 0.8875, UEM: 0.5804, LEM: 0.3326, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5472, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7836, loss: 0.7904, batch_reg_loss: 0.1635, reg_loss: 0.1628 ||: 95%|#########4| 90/95 [01:00<00:03, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9395, LAS: 0.8861, UEM: 0.5729, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7152, loss: 0.8014, batch_reg_loss: 0.1635, reg_loss: 0.1628 ||: 99%|#########8| 94/95 [01:02<00:00, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9398, LAS: 0.8863, UEM: 0.5764, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2508, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5663, loss: 0.7989, batch_reg_loss: 0.1636, reg_loss: 0.1628 ||: 100%|##########| 95/95 [01:03<00:00, 1.51it/s]\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - reg_loss | 0.163 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - UEM | 0.576 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - LEM | 0.329 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EM | 0.906 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.251 | N/A\n", + "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.441 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - loss | 0.799 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - LAS | 0.886 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:25,922 - INFO - combo.training.trainer - Epoch duration: 0:01:03.115203\n", + "2023-04-06 23:59:25,922 - INFO - combo.training.trainer - Estimated training time remaining: 6:20:40\n", + "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - Epoch 62/399\n", + "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:59:25,928 
- INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9352, LAS: 0.8864, UEM: 0.6689, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1004, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.8111, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9423, LAS: 0.8922, UEM: 0.5717, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6524, partial_loss/deprel_loss: 0.7108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8628, loss: 0.7538, batch_reg_loss: 0.1637, reg_loss: 0.1636 ||: 7%|7 | 7/95 [00:04<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9436, LAS: 0.8937, UEM: 0.6140, LEM: 0.3753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9611, partial_loss/deprel_loss: 0.8192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0113, loss: 0.7286, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 11%|# | 10/95 [00:06<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9404, LAS: 0.8906, UEM: 0.5818, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7859, partial_loss/deprel_loss: 0.7698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9368, loss: 0.7612, batch_reg_loss: 0.1638, reg_loss: 0.1637 ||: 15%|#4 | 14/95 [00:09<00:54, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9275, UAS: 0.9457, LAS: 0.8979, UEM: 0.6694, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.7118, batch_reg_loss: 0.1638, reg_loss: 0.1637 ||: 18%|#7 | 17/95 [00:11<00:55, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9462, LAS: 0.8974, UEM: 0.6547, LEM: 0.4268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6472, partial_loss/deprel_loss: 0.7830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9197, loss: 0.7198, batch_reg_loss: 0.1639, reg_loss: 0.1637 ||: 21%|##1 | 20/95 [00:13<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9451, LAS: 0.8964, UEM: 0.6450, LEM: 0.4199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0052, loss: 0.7245, batch_reg_loss: 0.1639, reg_loss: 0.1638 ||: 24%|##4 | 23/95 [00:16<00:51, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9416, LAS: 0.8921, UEM: 0.6166, LEM: 0.3929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6848, partial_loss/deprel_loss: 0.7441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.7624, batch_reg_loss: 0.1640, reg_loss: 0.1638 ||: 28%|##8 | 27/95 [00:18<00:46, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9440, LAS: 0.8946, UEM: 0.6354, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.4524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5808, loss: 
0.7425, batch_reg_loss: 0.1640, reg_loss: 0.1638 ||: 32%|###1 | 30/95 [00:20<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9422, LAS: 0.8927, UEM: 0.6160, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0462, partial_loss/deprel_loss: 0.8503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0535, loss: 0.7598, batch_reg_loss: 0.1641, reg_loss: 0.1638 ||: 36%|###5 | 34/95 [00:22<00:40, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9412, LAS: 0.8911, UEM: 0.5973, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6510, partial_loss/deprel_loss: 0.6828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8406, loss: 0.7688, batch_reg_loss: 0.1641, reg_loss: 0.1639 ||: 40%|#### | 38/95 [00:25<00:36, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9415, LAS: 0.8911, UEM: 0.5952, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8107, partial_loss/deprel_loss: 0.7510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9271, loss: 0.7698, batch_reg_loss: 0.1642, reg_loss: 0.1639 ||: 44%|####4 | 42/95 [00:28<00:34, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9412, LAS: 0.8902, UEM: 0.5865, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0094, partial_loss/deprel_loss: 0.8746, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0658, loss: 0.7748, batch_reg_loss: 0.1642, reg_loss: 0.1639 ||: 48%|####8 | 46/95 [00:30<00:31, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9409, LAS: 0.8899, UEM: 
0.5940, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5632, partial_loss/deprel_loss: 0.7819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9025, loss: 0.7776, batch_reg_loss: 0.1643, reg_loss: 0.1640 ||: 53%|#####2 | 50/95 [00:33<00:29, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9404, LAS: 0.8896, UEM: 0.6009, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.7804, batch_reg_loss: 0.1644, reg_loss: 0.1640 ||: 57%|#####6 | 54/95 [00:36<00:27, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9396, LAS: 0.8884, UEM: 0.5930, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5070, partial_loss/deprel_loss: 0.6170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7874, batch_reg_loss: 0.1644, reg_loss: 0.1640 ||: 61%|######1 | 58/95 [00:38<00:24, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9398, LAS: 0.8883, UEM: 0.5847, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.7893, batch_reg_loss: 0.1645, reg_loss: 0.1640 ||: 65%|######5 | 62/95 [00:41<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9405, LAS: 0.8889, UEM: 0.5865, LEM: 0.3500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3470, partial_loss/deprel_loss: 0.5598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6818, loss: 0.7835, batch_reg_loss: 
0.1645, reg_loss: 0.1641 ||: 68%|######8 | 65/95 [00:44<00:21, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9407, LAS: 0.8892, UEM: 0.5836, LEM: 0.3467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3367, partial_loss/deprel_loss: 0.4958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6286, loss: 0.7819, batch_reg_loss: 0.1646, reg_loss: 0.1641 ||: 72%|#######1 | 68/95 [00:46<00:19, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8300, UAS: 0.9397, LAS: 0.8878, UEM: 0.5751, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3214, partial_loss/deprel_loss: 0.9422, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1827, loss: 0.7904, batch_reg_loss: 0.1646, reg_loss: 0.1641 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9409, LAS: 0.8891, UEM: 0.5931, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1709, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4959, loss: 0.7792, batch_reg_loss: 0.1647, reg_loss: 0.1641 ||: 78%|#######7 | 74/95 [00:50<00:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9412, LAS: 0.8893, UEM: 0.5962, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1853, partial_loss/deprel_loss: 0.3972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.7765, batch_reg_loss: 0.1647, reg_loss: 0.1642 ||: 81%|########1 | 77/95 [00:52<00:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9410, LAS: 0.8891, UEM: 0.5931, LEM: 0.3533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0801, partial_loss/deprel_loss: 0.9144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1123, loss: 0.7780, batch_reg_loss: 0.1648, reg_loss: 0.1642 ||: 84%|########4 | 80/95 [00:54<00:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9405, LAS: 0.8886, UEM: 0.5904, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2335, partial_loss/deprel_loss: 0.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.7813, batch_reg_loss: 0.1648, reg_loss: 0.1642 ||: 88%|########8 | 84/95 [00:57<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9401, LAS: 0.8881, UEM: 0.5874, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5134, partial_loss/deprel_loss: 0.5706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.7856, batch_reg_loss: 0.1649, reg_loss: 0.1642 ||: 93%|#########2| 88/95 [00:59<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9391, LAS: 0.8870, UEM: 0.5827, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1079, partial_loss/deprel_loss: 1.1986, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5454, loss: 0.7937, batch_reg_loss: 0.1649, reg_loss: 0.1643 ||: 96%|#########5| 91/95 [01:02<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9392, LAS: 0.8870, UEM: 0.5792, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.5187, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6370, loss: 0.7949, batch_reg_loss: 0.1650, reg_loss: 0.1643 ||: 100%|##########| 95/95 [01:04<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9392, LAS: 0.8870, UEM: 0.5792, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6370, loss: 0.7949, batch_reg_loss: 0.1650, reg_loss: 0.1643 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - reg_loss | 0.164 | N/A\n", + "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LEM | 0.338 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - EM | 0.907 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.285 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - 
partial_loss/deprel_loss | 0.519 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - loss | 0.795 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LAS | 0.887 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:00:30,729 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:30,729 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:30,729 - INFO - combo.training.trainer - Epoch duration: 0:01:04.807186\n", + "2023-04-07 00:00:30,729 - INFO - combo.training.trainer - Estimated training time remaining: 6:19:18\n", + "2023-04-07 00:00:30,729 - INFO - allennlp.training.trainer - Epoch 63/399\n", + "2023-04-07 00:00:30,729 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:00:30,730 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:00:30,735 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9214, LAS: 0.8709, UEM: 0.3921, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3276, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.9274, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||: 4%|4 | 4/95 [00:02<01:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8297, UAS: 0.9183, LAS: 0.8660, UEM: 0.3468, LEM: 0.1579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3947, partial_loss/deprel_loss: 0.8886, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1549, loss: 0.9582, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||: 7%|7 | 7/95 [00:04<00:59, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9267, LAS: 0.8754, UEM: 0.4078, LEM: 0.2043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6982, partial_loss/deprel_loss: 0.7160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8776, loss: 0.8958, batch_reg_loss: 0.1652, reg_loss: 0.1651 ||: 12%|#1 | 11/95 [00:06<00:52, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9305, LAS: 0.8789, UEM: 0.4726, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0189, partial_loss/deprel_loss: 0.8535, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0519, loss: 0.8685, batch_reg_loss: 0.1653, reg_loss: 0.1652 ||: 16%|#5 | 15/95 [00:09<00:49, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9332, LAS: 0.8818, UEM: 0.4824, LEM: 0.2443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5805, partial_loss/deprel_loss: 0.7069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8470, loss: 0.8474, batch_reg_loss: 0.1653, reg_loss: 0.1652 ||: 19%|#8 | 18/95 [00:11<00:48, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9346, LAS: 0.8828, UEM: 0.4713, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.6779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8016, loss: 0.8447, batch_reg_loss: 0.1654, reg_loss: 0.1652 ||: 22%|##2 | 21/95 [00:13<00:48, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9343, LAS: 0.8826, UEM: 0.4678, LEM: 0.2258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2384, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5646, loss: 0.8508, batch_reg_loss: 0.1655, reg_loss: 0.1652 ||: 26%|##6 | 25/95 [00:15<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9365, LAS: 0.8847, UEM: 0.5053, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6228, partial_loss/deprel_loss: 0.7041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8533, loss: 0.8323, batch_reg_loss: 0.1655, reg_loss: 0.1653 ||: 31%|### | 29/95 [00:18<00:43, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9382, LAS: 0.8863, UEM: 0.5066, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4859, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7441, loss: 0.8173, batch_reg_loss: 0.1656, reg_loss: 0.1653 ||: 35%|###4 | 33/95 [00:21<00:40, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9401, LAS: 0.8883, UEM: 0.5258, LEM: 0.2682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.5999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7378, loss: 0.8021, batch_reg_loss: 0.1656, reg_loss: 0.1653 ||: 38%|###7 | 36/95 [00:23<00:41, 1.44it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9416, LAS: 0.8898, UEM: 0.5378, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3752, partial_loss/deprel_loss: 0.4718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6181, loss: 0.7879, batch_reg_loss: 0.1656, reg_loss: 0.1654 ||: 41%|####1 | 39/95 [00:25<00:38, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9415, LAS: 0.8892, UEM: 0.5376, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.4684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5834, loss: 0.7905, batch_reg_loss: 0.1657, reg_loss: 0.1654 ||: 45%|####5 | 43/95 [00:27<00:34, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9408, LAS: 0.8884, UEM: 0.5277, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7331, partial_loss/deprel_loss: 0.7146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8840, loss: 0.7976, batch_reg_loss: 0.1657, reg_loss: 0.1654 ||: 48%|####8 | 46/95 [00:29<00:32, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9413, LAS: 0.8890, UEM: 0.5571, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3109, loss: 0.7932, batch_reg_loss: 0.1658, reg_loss: 0.1654 ||: 53%|#####2 | 50/95 [00:33<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9382, LAS: 0.8855, UEM: 0.5419, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.8462, partial_loss/deprel_loss: 0.8174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9890, loss: 0.8220, batch_reg_loss: 0.1658, reg_loss: 0.1655 ||: 57%|#####6 | 54/95 [00:35<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8002, UAS: 0.9376, LAS: 0.8850, UEM: 0.5406, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9688, partial_loss/deprel_loss: 1.1840, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5069, loss: 0.8260, batch_reg_loss: 0.1659, reg_loss: 0.1655 ||: 61%|######1 | 58/95 [00:38<00:24, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9384, LAS: 0.8859, UEM: 0.5466, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.3812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.8189, batch_reg_loss: 0.1659, reg_loss: 0.1655 ||: 64%|######4 | 61/95 [00:40<00:23, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9396, LAS: 0.8873, UEM: 0.5644, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.8056, batch_reg_loss: 0.1660, reg_loss: 0.1655 ||: 67%|######7 | 64/95 [00:42<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9396, LAS: 0.8872, UEM: 0.5700, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1402, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4796, loss: 0.8043, batch_reg_loss: 0.1660, reg_loss: 0.1656 ||: 71%|####### | 67/95 [00:44<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9395, LAS: 0.8872, UEM: 0.5704, LEM: 0.3235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6865, loss: 0.8056, batch_reg_loss: 0.1661, reg_loss: 0.1656 ||: 75%|#######4 | 71/95 [00:47<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9397, LAS: 0.8872, UEM: 0.5716, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5127, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8010, loss: 0.8049, batch_reg_loss: 0.1661, reg_loss: 0.1656 ||: 78%|#######7 | 74/95 [00:49<00:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9397, LAS: 0.8872, UEM: 0.5663, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5178, partial_loss/deprel_loss: 0.6335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7766, loss: 0.8046, batch_reg_loss: 0.1662, reg_loss: 0.1656 ||: 81%|########1 | 77/95 [00:51<00:12, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9391, LAS: 0.8865, UEM: 0.5645, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3299, partial_loss/deprel_loss: 0.9747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2120, loss: 0.8106, batch_reg_loss: 0.1662, reg_loss: 0.1657 ||: 84%|########4 | 80/95 [00:54<00:10, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9400, LAS: 0.8874, UEM: 0.5756, LEM: 0.3282, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2448, partial_loss/deprel_loss: 0.5046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6189, loss: 0.8024, batch_reg_loss: 0.1663, reg_loss: 0.1657 ||: 87%|########7 | 83/95 [00:56<00:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9407, LAS: 0.8882, UEM: 0.5854, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3117, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5940, loss: 0.7962, batch_reg_loss: 0.1663, reg_loss: 0.1657 ||: 91%|######### | 86/95 [00:58<00:06, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9402, LAS: 0.8877, UEM: 0.5813, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9233, partial_loss/deprel_loss: 0.7878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9813, loss: 0.8002, batch_reg_loss: 0.1664, reg_loss: 0.1657 ||: 94%|#########3| 89/95 [01:00<00:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9401, LAS: 0.8875, UEM: 0.5781, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9979, partial_loss/deprel_loss: 0.9188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1010, loss: 0.8021, batch_reg_loss: 0.1664, reg_loss: 0.1657 ||: 97%|#########6| 92/95 [01:02<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9401, LAS: 0.8876, UEM: 0.5794, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1858, partial_loss/deprel_loss: 0.9170, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1372, loss: 0.8015, batch_reg_loss: 0.1665, reg_loss: 
0.1658 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - reg_loss | 0.166 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - LEM | 0.335 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EM | 0.851 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.186 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.917 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:01:35,409 - 
INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.trainer - Epoch duration: 0:01:04.680005\n", + "2023-04-07 00:01:35,409 - INFO - combo.training.trainer - Estimated training time remaining: 6:17:55\n", + "2023-04-07 00:01:35,409 - INFO - allennlp.training.trainer - Epoch 64/399\n", + "2023-04-07 00:01:35,410 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:01:35,410 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:01:35,416 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9472, LAS: 0.9002, UEM: 0.5593, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.7240, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 4%|4 | 4/95 [00:02<00:59, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9445, LAS: 0.8949, UEM: 0.5081, LEM: 0.2425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8786, partial_loss/deprel_loss: 0.8800, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0463, loss: 0.7558, batch_reg_loss: 0.1666, reg_loss: 0.1665 ||: 8%|8 | 8/95 [00:04<00:54, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9423, LAS: 0.8919, UEM: 0.4719, LEM: 0.2172, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7350, partial_loss/deprel_loss: 0.6780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8560, loss: 0.7743, batch_reg_loss: 0.1666, reg_loss: 0.1666 ||: 13%|#2 | 12/95 [00:07<00:52, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9363, LAS: 0.8857, UEM: 0.5424, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8850, partial_loss/deprel_loss: 0.7542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.8111, batch_reg_loss: 0.1667, reg_loss: 0.1666 ||: 16%|#5 | 15/95 [00:09<00:54, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9363, LAS: 0.8849, UEM: 0.5609, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3685, partial_loss/deprel_loss: 0.9459, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1972, loss: 0.8203, batch_reg_loss: 0.1667, reg_loss: 0.1666 ||: 20%|## | 19/95 [00:12<00:50, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9379, LAS: 0.8866, UEM: 0.5555, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7078, partial_loss/deprel_loss: 0.6756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8488, loss: 0.8055, batch_reg_loss: 0.1668, reg_loss: 0.1666 ||: 24%|##4 | 23/95 [00:14<00:46, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9390, LAS: 0.8881, UEM: 0.5410, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.7956, 
batch_reg_loss: 0.1669, reg_loss: 0.1667 ||: 28%|##8 | 27/95 [00:17<00:42, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9401, LAS: 0.8887, UEM: 0.5347, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8162, loss: 0.7944, batch_reg_loss: 0.1669, reg_loss: 0.1667 ||: 33%|###2 | 31/95 [00:19<00:38, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9404, LAS: 0.8885, UEM: 0.5455, LEM: 0.2973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4811, partial_loss/deprel_loss: 0.5935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7380, loss: 0.7950, batch_reg_loss: 0.1670, reg_loss: 0.1667 ||: 37%|###6 | 35/95 [00:21<00:37, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9410, LAS: 0.8897, UEM: 0.5818, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3507, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.7895, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||: 41%|####1 | 39/95 [00:25<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9411, LAS: 0.8898, UEM: 0.5699, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4048, partial_loss/deprel_loss: 0.5478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.7894, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||: 44%|####4 | 42/95 [00:28<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8088, UAS: 0.9403, LAS: 0.8891, UEM: 0.5757, 
LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6599, partial_loss/deprel_loss: 1.0256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3196, loss: 0.7933, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||: 47%|####7 | 45/95 [00:30<00:38, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9398, LAS: 0.8885, UEM: 0.5682, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3592, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.7956, batch_reg_loss: 0.1672, reg_loss: 0.1668 ||: 52%|#####1 | 49/95 [00:33<00:35, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9409, LAS: 0.8897, UEM: 0.5873, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2698, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.7860, batch_reg_loss: 0.1672, reg_loss: 0.1669 ||: 55%|#####4 | 52/95 [00:35<00:32, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9411, LAS: 0.8898, UEM: 0.5823, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.7107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8565, loss: 0.7849, batch_reg_loss: 0.1673, reg_loss: 0.1669 ||: 59%|#####8 | 56/95 [00:38<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9406, LAS: 0.8893, UEM: 0.5731, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.7874, batch_reg_loss: 0.1674, 
reg_loss: 0.1669 ||: 63%|######3 | 60/95 [00:40<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9410, LAS: 0.8894, UEM: 0.5753, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5480, partial_loss/deprel_loss: 0.6567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8024, loss: 0.7839, batch_reg_loss: 0.1674, reg_loss: 0.1670 ||: 67%|######7 | 64/95 [00:43<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9406, LAS: 0.8890, UEM: 0.5698, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2822, partial_loss/deprel_loss: 0.4641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5952, loss: 0.7861, batch_reg_loss: 0.1675, reg_loss: 0.1670 ||: 72%|#######1 | 68/95 [00:46<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9412, LAS: 0.8896, UEM: 0.5707, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5073, partial_loss/deprel_loss: 0.7481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.7817, batch_reg_loss: 0.1675, reg_loss: 0.1670 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8362, UAS: 0.9407, LAS: 0.8891, UEM: 0.5695, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3392, partial_loss/deprel_loss: 1.0263, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2565, loss: 0.7844, batch_reg_loss: 0.1676, reg_loss: 0.1670 ||: 79%|#######8 | 75/95 [00:50<00:13, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9401, LAS: 0.8884, UEM: 0.5636, LEM: 
0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4045, partial_loss/deprel_loss: 0.5355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6769, loss: 0.7911, batch_reg_loss: 0.1676, reg_loss: 0.1671 ||: 82%|########2 | 78/95 [00:53<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9406, LAS: 0.8891, UEM: 0.5730, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1452, partial_loss/deprel_loss: 0.3148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4486, loss: 0.7860, batch_reg_loss: 0.1677, reg_loss: 0.1671 ||: 86%|########6 | 82/95 [00:55<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9412, LAS: 0.8897, UEM: 0.5791, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1987, partial_loss/deprel_loss: 0.3826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.7819, batch_reg_loss: 0.1677, reg_loss: 0.1671 ||: 89%|########9 | 85/95 [00:58<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9409, LAS: 0.8892, UEM: 0.5757, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4878, partial_loss/deprel_loss: 0.6423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7792, loss: 0.7858, batch_reg_loss: 0.1678, reg_loss: 0.1671 ||: 93%|#########2| 88/95 [01:00<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9403, LAS: 0.8885, UEM: 0.5799, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3140, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2767, loss: 0.7918, batch_reg_loss: 
0.1678, reg_loss: 0.1672 ||: 96%|#########5| 91/95 [01:02<00:02, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9396, LAS: 0.8877, UEM: 0.5755, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4699, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7469, loss: 0.7974, batch_reg_loss: 0.1679, reg_loss: 0.1672 ||: 99%|#########8| 94/95 [01:04<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9399, LAS: 0.8881, UEM: 0.5787, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5194, loss: 0.7945, batch_reg_loss: 0.1679, reg_loss: 0.1672 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - reg_loss | 0.167 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - LEM | 0.337 | N/A\n", + "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EM | 0.919 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.215 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - 
UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.386 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - loss | 0.795 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:02:40,498 - INFO - combo.training.trainer - Epoch duration: 0:01:05.088427\n", + "2023-04-07 00:02:40,498 - INFO - combo.training.trainer - Estimated training time remaining: 6:16:36\n", + "2023-04-07 00:02:40,498 - INFO - allennlp.training.trainer - Epoch 65/399\n", + "2023-04-07 00:02:40,498 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:02:40,499 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:02:40,505 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9564, LAS: 0.9078, UEM: 0.6076, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4727, partial_loss/deprel_loss: 0.5492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7018, loss: 0.6344, batch_reg_loss: 0.1679, reg_loss: 0.1679 ||: 3%|3 | 3/95 [00:02<01:13, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9593, LAS: 0.9088, UEM: 0.6460, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2772, partial_loss/deprel_loss: 0.5124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.6441, batch_reg_loss: 0.1680, reg_loss: 0.1679 ||: 6%|6 | 6/95 [00:04<01:09, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9529, LAS: 0.9027, UEM: 0.6704, LEM: 0.4140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1125, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3806, loss: 0.6866, batch_reg_loss: 0.1680, reg_loss: 0.1680 ||: 9%|9 | 9/95 [00:06<01:04, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9511, LAS: 0.9012, UEM: 0.6389, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7581, partial_loss/deprel_loss: 0.6781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8622, loss: 0.6975, batch_reg_loss: 0.1681, reg_loss: 0.1680 ||: 13%|#2 | 12/95 [00:08<01:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9522, LAS: 0.9026, UEM: 0.6560, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4369, partial_loss/deprel_loss: 0.6236, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7544, loss: 0.6851, batch_reg_loss: 0.1681, reg_loss: 0.1680 ||: 16%|#5 | 15/95 [00:10<00:58, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9511, LAS: 0.9019, UEM: 0.6863, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8530, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9697, loss: 0.6922, batch_reg_loss: 0.1682, reg_loss: 0.1680 ||: 19%|#8 | 18/95 [00:13<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9495, LAS: 0.8995, UEM: 0.6710, LEM: 0.4392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3663, partial_loss/deprel_loss: 0.5152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6536, loss: 0.7071, batch_reg_loss: 0.1682, reg_loss: 0.1681 ||: 23%|##3 | 22/95 [00:15<00:51, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9493, LAS: 0.8991, UEM: 0.6559, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.7120, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||: 26%|##6 | 25/95 [00:17<00:50, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9492, LAS: 0.8993, UEM: 0.6571, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5650, loss: 0.7124, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||: 29%|##9 | 28/95 [00:19<00:47, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8608, UAS: 0.9469, 
LAS: 0.8965, UEM: 0.6418, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9097, partial_loss/deprel_loss: 0.8116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9995, loss: 0.7314, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||: 34%|###3 | 32/95 [00:22<00:42, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9467, LAS: 0.8962, UEM: 0.6360, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7673, partial_loss/deprel_loss: 0.7183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8965, loss: 0.7326, batch_reg_loss: 0.1684, reg_loss: 0.1682 ||: 38%|###7 | 36/95 [00:24<00:38, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9472, LAS: 0.8970, UEM: 0.6440, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2836, partial_loss/deprel_loss: 0.4544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5887, loss: 0.7272, batch_reg_loss: 0.1684, reg_loss: 0.1682 ||: 42%|####2 | 40/95 [00:27<00:35, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9445, LAS: 0.8937, UEM: 0.6242, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5100, partial_loss/deprel_loss: 0.6251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.7519, batch_reg_loss: 0.1685, reg_loss: 0.1682 ||: 46%|####6 | 44/95 [00:29<00:31, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9451, LAS: 0.8943, UEM: 0.6272, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6013, partial_loss/deprel_loss: 0.6473, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8067, loss: 0.7459, batch_reg_loss: 0.1685, reg_loss: 0.1682 ||: 51%|##### | 48/95 [00:32<00:29, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9457, LAS: 0.8946, UEM: 0.6246, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2902, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5811, loss: 0.7445, batch_reg_loss: 0.1686, reg_loss: 0.1683 ||: 55%|#####4 | 52/95 [00:35<00:28, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9447, LAS: 0.8932, UEM: 0.6123, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7916, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9691, loss: 0.7550, batch_reg_loss: 0.1687, reg_loss: 0.1683 ||: 59%|#####8 | 56/95 [00:37<00:25, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9437, LAS: 0.8923, UEM: 0.6005, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2806, partial_loss/deprel_loss: 0.9364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1740, loss: 0.7627, batch_reg_loss: 0.1687, reg_loss: 0.1683 ||: 63%|######3 | 60/95 [00:39<00:21, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8578, UAS: 0.9435, LAS: 0.8919, UEM: 0.5947, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9394, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.7646, batch_reg_loss: 0.1688, reg_loss: 0.1683 ||: 67%|######7 | 64/95 [00:42<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9428, LAS: 0.8911, UEM: 0.5987, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2543, partial_loss/deprel_loss: 0.4429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5740, loss: 0.7699, batch_reg_loss: 0.1688, reg_loss: 0.1684 ||: 72%|#######1 | 68/95 [00:45<00:17, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9426, LAS: 0.8908, UEM: 0.5985, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2651, partial_loss/deprel_loss: 0.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5343, loss: 0.7715, batch_reg_loss: 0.1689, reg_loss: 0.1684 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9427, LAS: 0.8907, UEM: 0.5906, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3585, partial_loss/deprel_loss: 0.5088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6477, loss: 0.7718, batch_reg_loss: 0.1690, reg_loss: 0.1684 ||: 80%|######## | 76/95 [00:50<00:12, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9404, LAS: 0.8882, UEM: 0.5791, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3009, partial_loss/deprel_loss: 0.8551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1133, loss: 0.7898, batch_reg_loss: 0.1690, reg_loss: 0.1685 ||: 84%|########4 | 80/95 [00:53<00:09, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8098, UAS: 0.9381, LAS: 0.8858, UEM: 0.5699, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6742, partial_loss/deprel_loss: 1.0952, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.3801, loss: 0.8083, batch_reg_loss: 0.1691, reg_loss: 0.1685 ||: 88%|########8 | 84/95 [00:55<00:07, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9385, LAS: 0.8863, UEM: 0.5736, LEM: 0.3352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5025, partial_loss/deprel_loss: 0.5241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 0.8038, batch_reg_loss: 0.1692, reg_loss: 0.1685 ||: 93%|#########2| 88/95 [00:58<00:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9391, LAS: 0.8868, UEM: 0.5768, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3505, partial_loss/deprel_loss: 0.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6704, loss: 0.7998, batch_reg_loss: 0.1693, reg_loss: 0.1685 ||: 97%|#########6| 92/95 [01:00<00:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9387, LAS: 0.8862, UEM: 0.5743, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4254, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.8043, batch_reg_loss: 0.1693, reg_loss: 0.1686 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:03:43,247 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9431, LAS: 0.8916, UEM: 0.5405, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3246, partial_loss/deprel_loss: 28.2893, partial_loss/cycle_loss: 0.0000, batch_loss: 22.6963, loss: 28.5523, batch_reg_loss: 0.0000, reg_loss: 
0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9353, LAS: 0.8808, UEM: 0.4659, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4638, partial_loss/deprel_loss: 57.8192, partial_loss/cycle_loss: 0.0000, batch_loss: 46.5482, loss: 31.9561, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9451, LAS: 0.8888, UEM: 0.5769, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5146, partial_loss/deprel_loss: 24.2149, partial_loss/cycle_loss: 0.0000, batch_loss: 19.4748, loss: 27.8085, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.07it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9462, LAS: 0.8915, UEM: 0.6454, LEM: 0.3727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9144, partial_loss/deprel_loss: 44.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 35.7222, loss: 27.4137, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9485, LAS: 0.8950, UEM: 0.6749, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 22.9214, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3801, loss: 26.5925, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01it/s]\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - Training | 
Validation\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - reg_loss | 0.169 | 0.000\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UEM | 0.574 | 0.675\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - LEM | 0.334 | 0.400\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EM | 0.896 | 0.929\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.425 | 0.215\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | 0.948\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.610 | 22.921\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - loss | 0.804 | 26.592\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - LAS | 0.886 | 0.895\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:54,101 - INFO - 
combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:54,102 - INFO - combo.training.trainer - Epoch duration: 0:01:13.603661\n", + "2023-04-07 00:03:54,102 - INFO - combo.training.trainer - Estimated training time remaining: 6:15:59\n", + "2023-04-07 00:03:54,102 - INFO - allennlp.training.trainer - Epoch 66/399\n", + "2023-04-07 00:03:54,102 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:03:54,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:03:54,110 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9601, LAS: 0.9097, UEM: 0.7095, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3314, partial_loss/deprel_loss: 0.5307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6602, loss: 0.6498, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 4%|4 | 4/95 [00:02<00:54, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9595, LAS: 0.9089, UEM: 0.7318, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5926, partial_loss/deprel_loss: 0.6805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8324, loss: 0.6449, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 7%|7 | 7/95 [00:04<00:55, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9554, LAS: 0.9035, UEM: 0.6783, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2470, partial_loss/deprel_loss: 
0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5369, loss: 0.6774, batch_reg_loss: 0.1695, reg_loss: 0.1694 ||: 12%|#1 | 11/95 [00:06<00:51, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9473, LAS: 0.8944, UEM: 0.6155, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9505, partial_loss/deprel_loss: 0.9103, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0879, loss: 0.7509, batch_reg_loss: 0.1695, reg_loss: 0.1694 ||: 16%|#5 | 15/95 [00:09<00:49, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9481, LAS: 0.8951, UEM: 0.6158, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5815, partial_loss/deprel_loss: 0.6274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7879, loss: 0.7384, batch_reg_loss: 0.1696, reg_loss: 0.1695 ||: 19%|#8 | 18/95 [00:11<00:49, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9467, LAS: 0.8940, UEM: 0.6187, LEM: 0.3435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1853, partial_loss/deprel_loss: 0.9649, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1786, loss: 0.7459, batch_reg_loss: 0.1696, reg_loss: 0.1695 ||: 22%|##2 | 21/95 [00:13<00:48, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9427, LAS: 0.8898, UEM: 0.6051, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4605, partial_loss/deprel_loss: 0.6038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7448, loss: 0.7777, batch_reg_loss: 0.1697, reg_loss: 0.1695 ||: 25%|##5 | 24/95 [00:15<00:46, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9414, LAS: 0.8885, UEM: 0.5777, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6379, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8258, loss: 0.7842, batch_reg_loss: 0.1697, reg_loss: 0.1695 ||: 29%|##9 | 28/95 [00:18<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9420, LAS: 0.8890, UEM: 0.5812, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.7807, batch_reg_loss: 0.1698, reg_loss: 0.1696 ||: 33%|###2 | 31/95 [00:20<00:43, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9431, LAS: 0.8901, UEM: 0.5918, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5835, partial_loss/deprel_loss: 0.7340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8737, loss: 0.7734, batch_reg_loss: 0.1698, reg_loss: 0.1696 ||: 36%|###5 | 34/95 [00:22<00:43, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9435, LAS: 0.8908, UEM: 0.5906, LEM: 0.3209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9176, loss: 0.7715, batch_reg_loss: 0.1699, reg_loss: 0.1696 ||: 39%|###8 | 37/95 [00:24<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9435, LAS: 0.8912, UEM: 0.6163, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.1037, partial_loss/deprel_loss: 0.9039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1138, loss: 0.7703, batch_reg_loss: 0.1699, reg_loss: 0.1696 ||: 42%|####2 | 40/95 [00:27<00:41, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9444, LAS: 0.8924, UEM: 0.6293, LEM: 0.3798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1451, partial_loss/deprel_loss: 0.2613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4081, loss: 0.7592, batch_reg_loss: 0.1700, reg_loss: 0.1697 ||: 46%|####6 | 44/95 [00:30<00:37, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9447, LAS: 0.8929, UEM: 0.6220, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.5710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7128, loss: 0.7575, batch_reg_loss: 0.1700, reg_loss: 0.1697 ||: 49%|####9 | 47/95 [00:32<00:36, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9456, LAS: 0.8939, UEM: 0.6293, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4173, partial_loss/deprel_loss: 0.5274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.7488, batch_reg_loss: 0.1701, reg_loss: 0.1697 ||: 53%|#####2 | 50/95 [00:34<00:34, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9451, LAS: 0.8935, UEM: 0.6279, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.7522, batch_reg_loss: 0.1701, reg_loss: 0.1697 ||: 56%|#####5 | 53/95 [00:37<00:32, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9448, LAS: 0.8931, UEM: 0.6190, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.5620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6920, loss: 0.7568, batch_reg_loss: 0.1701, reg_loss: 0.1698 ||: 60%|###### | 57/95 [00:39<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9442, LAS: 0.8929, UEM: 0.6134, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7584, batch_reg_loss: 0.1702, reg_loss: 0.1698 ||: 64%|######4 | 61/95 [00:42<00:24, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9437, LAS: 0.8924, UEM: 0.6152, LEM: 0.3693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0340, partial_loss/deprel_loss: 0.9069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1026, loss: 0.7631, batch_reg_loss: 0.1702, reg_loss: 0.1698 ||: 67%|######7 | 64/95 [00:44<00:22, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9426, LAS: 0.8911, UEM: 0.6056, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6441, partial_loss/deprel_loss: 0.7303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8833, loss: 0.7733, batch_reg_loss: 0.1703, reg_loss: 0.1698 ||: 71%|####### | 67/95 [00:47<00:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9427, LAS: 0.8911, UEM: 0.6021, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2508, 
partial_loss/deprel_loss: 0.4391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.7728, batch_reg_loss: 0.1703, reg_loss: 0.1698 ||: 74%|#######3 | 70/95 [00:49<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9406, LAS: 0.8890, UEM: 0.5930, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8441, partial_loss/deprel_loss: 0.7311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9241, loss: 0.7889, batch_reg_loss: 0.1704, reg_loss: 0.1699 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9407, LAS: 0.8890, UEM: 0.5944, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.4895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.7878, batch_reg_loss: 0.1704, reg_loss: 0.1699 ||: 81%|########1 | 77/95 [00:53<00:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9409, LAS: 0.8890, UEM: 0.5910, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4703, partial_loss/deprel_loss: 0.5552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7087, loss: 0.7876, batch_reg_loss: 0.1705, reg_loss: 0.1699 ||: 84%|########4 | 80/95 [00:55<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9403, LAS: 0.8882, UEM: 0.5875, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2940, partial_loss/deprel_loss: 0.9074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1553, loss: 0.7936, batch_reg_loss: 0.1706, reg_loss: 0.1699 ||: 88%|########8 | 84/95 [00:58<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9388, LAS: 0.8866, UEM: 0.5830, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6039, loss: 0.8044, batch_reg_loss: 0.1706, reg_loss: 0.1700 ||: 93%|#########2| 88/95 [01:01<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9390, LAS: 0.8868, UEM: 0.5818, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3476, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.8040, batch_reg_loss: 0.1707, reg_loss: 0.1700 ||: 96%|#########5| 91/95 [01:03<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9398, LAS: 0.8876, UEM: 0.5812, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4487, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7212, loss: 0.7984, batch_reg_loss: 0.1708, reg_loss: 0.1700 ||: 100%|##########| 95/95 [01:05<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9398, LAS: 0.8876, UEM: 0.5812, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4487, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7212, loss: 0.7984, batch_reg_loss: 0.1708, reg_loss: 0.1700 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - 
combo.training.tensorboard_writer - reg_loss | 0.170 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - UEM | 0.581 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - LEM | 0.334 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EM | 0.899 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.449 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.576 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - loss | 0.798 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:00,016 - 
INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:00,017 - INFO - combo.training.trainer - Epoch duration: 0:01:05.914712\n", + "2023-04-07 00:05:00,017 - INFO - combo.training.trainer - Estimated training time remaining: 6:14:44\n", + "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - Epoch 67/399\n", + "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:05:00,024 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9324, LAS: 0.8811, UEM: 0.5772, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 0.7196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8357, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 3%|3 | 3/95 [00:02<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9336, LAS: 0.8826, UEM: 0.6490, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1526, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3954, loss: 0.8197, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9230, LAS: 0.8695, UEM: 0.5531, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5493, partial_loss/deprel_loss: 0.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7644, loss: 0.9168, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||: 
11%|# | 10/95 [00:06<00:58, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9311, LAS: 0.8784, UEM: 0.5744, LEM: 0.3594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.5015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.8554, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||: 14%|#3 | 13/95 [00:09<00:57, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9310, LAS: 0.8779, UEM: 0.5689, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2638, partial_loss/deprel_loss: 0.4523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.8573, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||: 17%|#6 | 16/95 [00:11<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9345, LAS: 0.8821, UEM: 0.5764, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2498, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4943, loss: 0.8235, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9346, LAS: 0.8826, UEM: 0.5587, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9149, partial_loss/deprel_loss: 0.8323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0199, loss: 0.8256, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||: 24%|##4 | 23/95 [00:16<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9347, LAS: 0.8831, UEM: 0.6021, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.9940, partial_loss/deprel_loss: 0.7965, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.8231, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||: 27%|##7 | 26/95 [00:18<00:52, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9344, LAS: 0.8825, UEM: 0.5849, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5843, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7773, loss: 0.8276, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||: 32%|###1 | 30/95 [00:21<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9317, LAS: 0.8796, UEM: 0.5668, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5949, partial_loss/deprel_loss: 0.6947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8460, loss: 0.8517, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||: 35%|###4 | 33/95 [00:23<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9325, LAS: 0.8805, UEM: 0.5634, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7286, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8771, loss: 0.8469, batch_reg_loss: 0.1713, reg_loss: 0.1711 ||: 39%|###8 | 37/95 [00:25<00:39, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9337, LAS: 0.8818, UEM: 0.5497, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4293, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7132, loss: 0.8384, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||: 43%|####3 | 41/95 [00:28<00:35, 1.53it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9360, LAS: 0.8841, UEM: 0.5664, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3171, partial_loss/deprel_loss: 0.5417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6682, loss: 0.8215, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||: 47%|####7 | 45/95 [00:30<00:32, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9355, LAS: 0.8832, UEM: 0.5485, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7287, partial_loss/deprel_loss: 0.7702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9334, loss: 0.8286, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||: 52%|#####1 | 49/95 [00:33<00:29, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9374, LAS: 0.8854, UEM: 0.5735, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1057, partial_loss/deprel_loss: 0.2971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4304, loss: 0.8117, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||: 56%|#####5 | 53/95 [00:36<00:28, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9383, LAS: 0.8866, UEM: 0.5730, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3638, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5678, loss: 0.8014, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||: 60%|###### | 57/95 [00:38<00:25, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.9382, LAS: 0.8865, UEM: 0.5793, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3618, partial_loss/deprel_loss: 1.0481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2825, loss: 0.8016, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||: 64%|######4 | 61/95 [00:41<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9387, LAS: 0.8872, UEM: 0.5830, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.4606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.7965, batch_reg_loss: 0.1717, reg_loss: 0.1713 ||: 68%|######8 | 65/95 [00:44<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9388, LAS: 0.8873, UEM: 0.5816, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4330, partial_loss/deprel_loss: 0.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6816, loss: 0.7948, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||: 72%|#######1 | 68/95 [00:46<00:18, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9387, LAS: 0.8871, UEM: 0.5752, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5528, partial_loss/deprel_loss: 0.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7865, loss: 0.7976, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9384, LAS: 0.8868, UEM: 0.5740, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1857, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1115, loss: 0.8005, batch_reg_loss: 
0.1718, reg_loss: 0.1713 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9380, LAS: 0.8862, UEM: 0.5700, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7909, loss: 0.8065, batch_reg_loss: 0.1719, reg_loss: 0.1714 ||: 81%|########1 | 77/95 [00:53<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9381, LAS: 0.8863, UEM: 0.5635, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4670, partial_loss/deprel_loss: 0.6401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7774, loss: 0.8060, batch_reg_loss: 0.1719, reg_loss: 0.1714 ||: 85%|########5 | 81/95 [00:55<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9376, LAS: 0.8858, UEM: 0.5677, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.8091, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||: 88%|########8 | 84/95 [00:57<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9380, LAS: 0.8862, UEM: 0.5673, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6295, loss: 0.8062, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||: 92%|#########1| 87/95 [01:00<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8334, UAS: 0.9381, LAS: 0.8865, UEM: 
0.5757, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3601, partial_loss/deprel_loss: 0.9394, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1956, loss: 0.8051, batch_reg_loss: 0.1721, reg_loss: 0.1714 ||: 95%|#########4| 90/95 [01:02<00:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9388, LAS: 0.8872, UEM: 0.5787, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5881, loss: 0.8000, batch_reg_loss: 0.1721, reg_loss: 0.1715 ||: 98%|#########7| 93/95 [01:04<00:01, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9392, LAS: 0.8877, UEM: 0.5798, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5817, loss: 0.7964, batch_reg_loss: 0.1722, reg_loss: 0.1715 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UEM | 0.580 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LEM | 0.338 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - EM | 0.915 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.307 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.435 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - loss | 0.796 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:06:06,257 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:06:06,257 - INFO - combo.training.trainer - Epoch duration: 0:01:06.240258\n", + "2023-04-07 00:06:06,257 - INFO - combo.training.trainer - Estimated training time remaining: 6:13:30\n", + "2023-04-07 00:06:06,257 - INFO - allennlp.training.trainer - Epoch 68/399\n", + "2023-04-07 00:06:06,258 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:06:06,258 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:06:06,265 
- INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9587, LAS: 0.9139, UEM: 0.7856, LEM: 0.5824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.4504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.5819, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 3%|3 | 3/95 [00:02<01:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9519, LAS: 0.9063, UEM: 0.7001, LEM: 0.4794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1949, partial_loss/deprel_loss: 0.3622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.6616, batch_reg_loss: 0.1723, reg_loss: 0.1722 ||: 7%|7 | 7/95 [00:04<01:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9491, LAS: 0.9010, UEM: 0.6554, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3870, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6979, loss: 0.7004, batch_reg_loss: 0.1723, reg_loss: 0.1722 ||: 12%|#1 | 11/95 [00:07<01:01, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9410, LAS: 0.8914, UEM: 0.6062, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3762, partial_loss/deprel_loss: 0.4839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.7718, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 16%|#5 | 15/95 [00:10<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9035, UAS: 0.9450, LAS: 0.8954, UEM: 0.6326, LEM: 0.3857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2793, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.7440, batch_reg_loss: 0.1724, reg_loss: 0.1723 ||: 19%|#8 | 18/95 [00:12<00:54, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9463, LAS: 0.8969, UEM: 0.6529, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1125, partial_loss/deprel_loss: 0.2689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4100, loss: 0.7289, batch_reg_loss: 0.1724, reg_loss: 0.1723 ||: 22%|##2 | 21/95 [00:14<00:53, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9478, LAS: 0.8982, UEM: 0.6541, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.7217, batch_reg_loss: 0.1725, reg_loss: 0.1723 ||: 26%|##6 | 25/95 [00:17<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9481, LAS: 0.8985, UEM: 0.6538, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1610, partial_loss/deprel_loss: 0.3754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.7196, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||: 31%|### | 29/95 [00:19<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9472, LAS: 0.8979, UEM: 0.6350, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9341, partial_loss/deprel_loss: 0.7667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9727, loss: 
0.7252, batch_reg_loss: 0.1726, reg_loss: 0.1724 ||: 35%|###4 | 33/95 [00:22<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9463, LAS: 0.8962, UEM: 0.6173, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4791, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 0.7406, batch_reg_loss: 0.1726, reg_loss: 0.1724 ||: 39%|###8 | 37/95 [00:24<00:38, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9454, LAS: 0.8949, UEM: 0.6123, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7145, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9511, loss: 0.7485, batch_reg_loss: 0.1727, reg_loss: 0.1724 ||: 43%|####3 | 41/95 [00:27<00:34, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9445, LAS: 0.8940, UEM: 0.5998, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3833, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.7572, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||: 47%|####7 | 45/95 [00:30<00:32, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9452, LAS: 0.8948, UEM: 0.6033, LEM: 0.3522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6803, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8344, loss: 0.7507, batch_reg_loss: 0.1728, reg_loss: 0.1725 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9437, LAS: 0.8933, 
UEM: 0.5970, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4687, partial_loss/deprel_loss: 0.5079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6729, loss: 0.7606, batch_reg_loss: 0.1729, reg_loss: 0.1725 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9430, LAS: 0.8921, UEM: 0.5866, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.6118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7549, loss: 0.7677, batch_reg_loss: 0.1729, reg_loss: 0.1725 ||: 59%|#####8 | 56/95 [00:37<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9418, LAS: 0.8908, UEM: 0.5768, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8159, partial_loss/deprel_loss: 0.7028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8984, loss: 0.7776, batch_reg_loss: 0.1730, reg_loss: 0.1726 ||: 63%|######3 | 60/95 [00:40<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9425, LAS: 0.8916, UEM: 0.5886, LEM: 0.3404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3835, partial_loss/deprel_loss: 0.4990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.7703, batch_reg_loss: 0.1731, reg_loss: 0.1726 ||: 67%|######7 | 64/95 [00:43<00:21, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9423, LAS: 0.8912, UEM: 0.5833, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6041, partial_loss/deprel_loss: 0.6684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8286, loss: 0.7740, 
batch_reg_loss: 0.1731, reg_loss: 0.1726 ||: 71%|####### | 67/95 [00:45<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9422, LAS: 0.8907, UEM: 0.5799, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7295, partial_loss/deprel_loss: 0.7300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9031, loss: 0.7775, batch_reg_loss: 0.1732, reg_loss: 0.1726 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9406, LAS: 0.8892, UEM: 0.5718, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3351, partial_loss/deprel_loss: 0.8683, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1349, loss: 0.7873, batch_reg_loss: 0.1732, reg_loss: 0.1727 ||: 78%|#######7 | 74/95 [00:50<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9409, LAS: 0.8895, UEM: 0.5731, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8301, loss: 0.7837, batch_reg_loss: 0.1733, reg_loss: 0.1727 ||: 81%|########1 | 77/95 [00:52<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9407, LAS: 0.8893, UEM: 0.5694, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1221, partial_loss/deprel_loss: 0.9179, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1321, loss: 0.7865, batch_reg_loss: 0.1733, reg_loss: 0.1727 ||: 85%|########5 | 81/95 [00:54<00:09, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9393, LAS: 0.8878, UEM: 0.5622, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4130, partial_loss/deprel_loss: 0.5317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6813, loss: 0.7980, batch_reg_loss: 0.1734, reg_loss: 0.1727 ||: 89%|########9 | 85/95 [00:57<00:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9388, LAS: 0.8872, UEM: 0.5587, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0143, partial_loss/deprel_loss: 0.9618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1458, loss: 0.8031, batch_reg_loss: 0.1735, reg_loss: 0.1728 ||: 94%|#########3| 89/95 [01:00<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9396, LAS: 0.8882, UEM: 0.5774, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0588, partial_loss/deprel_loss: 0.1635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3161, loss: 0.7969, batch_reg_loss: 0.1735, reg_loss: 0.1728 ||: 97%|#########6| 92/95 [01:03<00:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9393, LAS: 0.8879, UEM: 0.5786, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4150, partial_loss/deprel_loss: 0.9446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2123, loss: 0.7990, batch_reg_loss: 0.1736, reg_loss: 0.1728 ||: 100%|##########| 95/95 [01:05<00:00, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9393, LAS: 0.8879, UEM: 0.5786, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4150, 
partial_loss/deprel_loss: 0.9446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2123, loss: 0.7990, batch_reg_loss: 0.1736, reg_loss: 0.1728 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - LEM | 0.341 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - EM | 0.834 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.415 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.945 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - loss | 0.799 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 
| N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:11,493 - INFO - combo.training.trainer - Epoch duration: 0:01:05.235624\n", + "2023-04-07 00:07:11,493 - INFO - combo.training.trainer - Estimated training time remaining: 6:12:11\n", + "2023-04-07 00:07:11,493 - INFO - allennlp.training.trainer - Epoch 69/399\n", + "2023-04-07 00:07:11,493 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:07:11,494 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:07:11,501 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9319, LAS: 0.8809, UEM: 0.4658, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2728, partial_loss/deprel_loss: 0.9373, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1780, loss: 0.8313, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||: 4%|4 | 4/95 [00:02<00:55, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9396, LAS: 0.8886, UEM: 0.5949, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.7732, batch_reg_loss: 0.1737, reg_loss: 0.1736 ||: 7%|7 | 7/95 [00:04<00:55, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9369, LAS: 0.8864, UEM: 0.6029, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.3749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.7978, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 11%|# | 10/95 [00:06<00:57, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9417, LAS: 0.8934, UEM: 0.6786, LEM: 0.4823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0577, partial_loss/deprel_loss: 0.1619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3148, loss: 0.7504, batch_reg_loss: 0.1738, reg_loss: 0.1737 ||: 14%|#3 | 13/95 [00:09<01:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9398, LAS: 0.8907, UEM: 0.6684, LEM: 0.4707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3221, partial_loss/deprel_loss: 0.9825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2242, loss: 0.7711, batch_reg_loss: 0.1738, reg_loss: 0.1737 ||: 17%|#6 | 16/95 [00:11<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9422, LAS: 0.8933, UEM: 0.6685, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.6860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8620, loss: 0.7529, batch_reg_loss: 0.1739, reg_loss: 0.1737 ||: 20%|## | 19/95 [00:13<00:54, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9447, LAS: 0.8956, UEM: 0.6852, LEM: 0.4695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2802, partial_loss/deprel_loss: 0.4948, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7326, batch_reg_loss: 0.1739, reg_loss: 0.1737 ||: 23%|##3 | 22/95 [00:15<00:52, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9456, LAS: 0.8959, UEM: 0.6625, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3983, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7349, batch_reg_loss: 0.1739, reg_loss: 0.1738 ||: 27%|##7 | 26/95 [00:18<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9426, LAS: 0.8929, UEM: 0.6455, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3413, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7604, batch_reg_loss: 0.1740, reg_loss: 0.1738 ||: 32%|###1 | 30/95 [00:20<00:43, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9441, LAS: 0.8945, UEM: 0.6442, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3032, partial_loss/deprel_loss: 0.4812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6196, loss: 0.7508, batch_reg_loss: 0.1740, reg_loss: 0.1738 ||: 35%|###4 | 33/95 [00:23<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9453, LAS: 0.8956, UEM: 0.6464, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2720, partial_loss/deprel_loss: 0.4392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.7407, batch_reg_loss: 0.1741, reg_loss: 0.1738 ||: 38%|###7 | 36/95 [00:25<00:40, 1.44it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9452, LAS: 0.8957, UEM: 0.6449, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2043, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.7421, batch_reg_loss: 0.1741, reg_loss: 0.1739 ||: 41%|####1 | 39/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9450, LAS: 0.8955, UEM: 0.6347, LEM: 0.3927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5268, partial_loss/deprel_loss: 0.6980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8379, loss: 0.7425, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||: 44%|####4 | 42/95 [00:29<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9453, LAS: 0.8959, UEM: 0.6375, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2734, partial_loss/deprel_loss: 0.4405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.7410, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||: 47%|####7 | 45/95 [00:31<00:36, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9439, LAS: 0.8945, UEM: 0.6269, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.7511, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||: 51%|##### | 48/95 [00:33<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9444, LAS: 0.8951, UEM: 0.6316, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4268, 
partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6436, loss: 0.7477, batch_reg_loss: 0.1743, reg_loss: 0.1739 ||: 54%|#####3 | 51/95 [00:38<00:41, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9433, LAS: 0.8940, UEM: 0.6272, LEM: 0.3922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5344, loss: 0.7587, batch_reg_loss: 0.1743, reg_loss: 0.1740 ||: 57%|#####6 | 54/95 [00:40<00:35, 1.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9428, LAS: 0.8932, UEM: 0.6212, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.8650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0768, loss: 0.7622, batch_reg_loss: 0.1744, reg_loss: 0.1740 ||: 60%|###### | 57/95 [00:42<00:31, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9407, LAS: 0.8908, UEM: 0.6071, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5570, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.7790, batch_reg_loss: 0.1744, reg_loss: 0.1740 ||: 64%|######4 | 61/95 [00:45<00:26, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9403, LAS: 0.8903, UEM: 0.6131, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4550, loss: 0.7813, batch_reg_loss: 0.1745, reg_loss: 0.1740 ||: 67%|######7 | 64/95 [00:47<00:24, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9405, LAS: 0.8903, UEM: 0.6066, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7340, partial_loss/deprel_loss: 0.7126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8914, loss: 0.7835, batch_reg_loss: 0.1745, reg_loss: 0.1740 ||: 71%|####### | 67/95 [00:49<00:21, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9400, LAS: 0.8898, UEM: 0.5994, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1403, partial_loss/deprel_loss: 0.8225, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0606, loss: 0.7869, batch_reg_loss: 0.1746, reg_loss: 0.1741 ||: 75%|#######4 | 71/95 [00:52<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9404, LAS: 0.8902, UEM: 0.6003, LEM: 0.3654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2757, partial_loss/deprel_loss: 0.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.7836, batch_reg_loss: 0.1746, reg_loss: 0.1741 ||: 78%|#######7 | 74/95 [00:54<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9413, LAS: 0.8911, UEM: 0.6053, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6444, loss: 0.7775, batch_reg_loss: 0.1747, reg_loss: 0.1741 ||: 81%|########1 | 77/95 [00:56<00:13, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9409, LAS: 0.8904, UEM: 0.5997, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9304, 
partial_loss/deprel_loss: 0.9354, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1091, loss: 0.7823, batch_reg_loss: 0.1747, reg_loss: 0.1741 ||: 85%|########5 | 81/95 [00:59<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9223, UAS: 0.9405, LAS: 0.8899, UEM: 0.5967, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5691, loss: 0.7860, batch_reg_loss: 0.1748, reg_loss: 0.1742 ||: 88%|########8 | 84/95 [01:01<00:07, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9405, LAS: 0.8898, UEM: 0.5912, LEM: 0.3526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7375, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.7868, batch_reg_loss: 0.1748, reg_loss: 0.1742 ||: 92%|#########1| 87/95 [01:03<00:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9404, LAS: 0.8896, UEM: 0.5846, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5953, partial_loss/deprel_loss: 0.5995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7735, loss: 0.7882, batch_reg_loss: 0.1749, reg_loss: 0.1742 ||: 96%|#########5| 91/95 [01:06<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9403, LAS: 0.8894, UEM: 0.5817, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2989, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.7904, batch_reg_loss: 0.1749, reg_loss: 0.1742 ||: 
99%|#########8| 94/95 [01:08<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9402, LAS: 0.8892, UEM: 0.5793, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8387, partial_loss/deprel_loss: 0.7951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.7924, batch_reg_loss: 0.1750, reg_loss: 0.1743 ||: 100%|##########| 95/95 [01:08<00:00, 1.38it/s]\n", + "2023-04-07 00:08:20,495 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - reg_loss | 0.174 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - LEM | 0.341 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EM | 0.872 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.839 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.795 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - loss | 0.792 | 
N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - LAS | 0.889 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:20,497 - INFO - combo.training.trainer - Epoch duration: 0:01:09.004150\n", + "2023-04-07 00:08:20,498 - INFO - combo.training.trainer - Estimated training time remaining: 6:11:11\n", + "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - Epoch 70/399\n", + "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:08:20,505 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9491, LAS: 0.9010, UEM: 0.7922, LEM: 0.6567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0717, partial_loss/deprel_loss: 0.1955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3458, loss: 0.7096, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 3%|3 | 3/95 [00:02<01:19, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9440, LAS: 0.8947, UEM: 0.7003, LEM: 0.5279, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6981, partial_loss/deprel_loss: 0.7286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.7553, batch_reg_loss: 0.1751, reg_loss: 0.1750 ||: 6%|6 | 6/95 [00:04<01:13, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9396, LAS: 0.8888, UEM: 0.6422, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9106, partial_loss/deprel_loss: 0.7770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.8048, batch_reg_loss: 0.1751, reg_loss: 0.1750 ||: 9%|9 | 9/95 [00:06<01:06, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9413, LAS: 0.8906, UEM: 0.6105, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6072, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.7915, batch_reg_loss: 0.1752, reg_loss: 0.1751 ||: 13%|#2 | 12/95 [00:08<01:03, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9446, LAS: 0.8935, UEM: 0.6170, LEM: 0.3991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2828, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6582, loss: 0.7705, batch_reg_loss: 0.1752, reg_loss: 0.1751 ||: 16%|#5 | 15/95 [00:10<00:58, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9378, LAS: 0.8873, UEM: 0.5714, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6191, partial_loss/deprel_loss: 0.6607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8276, loss: 0.8160, batch_reg_loss: 0.1753, reg_loss: 0.1751 ||: 20%|## | 19/95 [00:13<00:53, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9368, LAS: 0.8858, UEM: 0.5476, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4515, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7370, loss: 0.8286, batch_reg_loss: 0.1753, reg_loss: 0.1751 ||: 23%|##3 | 22/95 [00:15<00:50, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9399, LAS: 0.8889, UEM: 0.5813, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1573, partial_loss/deprel_loss: 0.3624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4967, loss: 0.8035, batch_reg_loss: 0.1753, reg_loss: 0.1752 ||: 27%|##7 | 26/95 [00:17<00:46, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9405, LAS: 0.8898, UEM: 0.5877, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.4406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5911, loss: 0.7973, batch_reg_loss: 0.1754, reg_loss: 0.1752 ||: 32%|###1 | 30/95 [00:20<00:43, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9412, LAS: 0.8907, UEM: 0.5935, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8567, partial_loss/deprel_loss: 0.7805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9712, loss: 0.7906, batch_reg_loss: 0.1754, reg_loss: 0.1752 ||: 35%|###4 | 33/95 [00:22<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9419, LAS: 0.8914, UEM: 0.5897, LEM: 
0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5001, partial_loss/deprel_loss: 0.5773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7373, loss: 0.7822, batch_reg_loss: 0.1755, reg_loss: 0.1752 ||: 38%|###7 | 36/95 [00:24<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9427, LAS: 0.8918, UEM: 0.5907, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5370, loss: 0.7771, batch_reg_loss: 0.1755, reg_loss: 0.1753 ||: 42%|####2 | 40/95 [00:27<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9419, LAS: 0.8912, UEM: 0.5871, LEM: 0.3507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0417, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.7813, batch_reg_loss: 0.1756, reg_loss: 0.1753 ||: 45%|####5 | 43/95 [00:29<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9427, LAS: 0.8918, UEM: 0.5864, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4019, partial_loss/deprel_loss: 0.6446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7716, loss: 0.7764, batch_reg_loss: 0.1756, reg_loss: 0.1753 ||: 48%|####8 | 46/95 [00:32<00:35, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9442, LAS: 0.8934, UEM: 0.6045, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.4484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.7629, batch_reg_loss: 0.1756, reg_loss: 
0.1753 ||: 52%|#####1 | 49/95 [00:34<00:34, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9450, LAS: 0.8945, UEM: 0.6186, LEM: 0.3756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4040, loss: 0.7553, batch_reg_loss: 0.1757, reg_loss: 0.1753 ||: 55%|#####4 | 52/95 [00:36<00:33, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9457, LAS: 0.8950, UEM: 0.6215, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4822, partial_loss/deprel_loss: 0.6509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7929, loss: 0.7510, batch_reg_loss: 0.1757, reg_loss: 0.1754 ||: 58%|#####7 | 55/95 [00:39<00:30, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9443, LAS: 0.8935, UEM: 0.6121, LEM: 0.3654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2571, partial_loss/deprel_loss: 0.9744, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2066, loss: 0.7650, batch_reg_loss: 0.1757, reg_loss: 0.1754 ||: 62%|######2 | 59/95 [00:41<00:25, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9436, LAS: 0.8929, UEM: 0.6058, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.5462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6857, loss: 0.7703, batch_reg_loss: 0.1758, reg_loss: 0.1754 ||: 65%|######5 | 62/95 [00:43<00:23, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9439, LAS: 0.8931, UEM: 0.6097, LEM: 0.3655, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1138, partial_loss/deprel_loss: 0.3408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4712, loss: 0.7681, batch_reg_loss: 0.1758, reg_loss: 0.1754 ||: 68%|######8 | 65/95 [00:45<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9446, LAS: 0.8938, UEM: 0.6160, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2118, partial_loss/deprel_loss: 0.4220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.7613, batch_reg_loss: 0.1759, reg_loss: 0.1754 ||: 72%|#######1 | 68/95 [00:48<00:19, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9449, LAS: 0.8940, UEM: 0.6113, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4066, partial_loss/deprel_loss: 0.5803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7214, loss: 0.7603, batch_reg_loss: 0.1759, reg_loss: 0.1755 ||: 76%|#######5 | 72/95 [00:50<00:16, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9450, LAS: 0.8938, UEM: 0.6085, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2725, partial_loss/deprel_loss: 0.5266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.7618, batch_reg_loss: 0.1760, reg_loss: 0.1755 ||: 79%|#######8 | 75/95 [00:52<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8082, UAS: 0.9432, LAS: 0.8917, UEM: 0.5998, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6078, partial_loss/deprel_loss: 1.0781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3600, loss: 0.7772, batch_reg_loss: 0.1760, reg_loss: 0.1755 
||: 83%|########3 | 79/95 [00:55<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9420, LAS: 0.8903, UEM: 0.5945, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8079, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9668, loss: 0.7864, batch_reg_loss: 0.1760, reg_loss: 0.1755 ||: 86%|########6 | 82/95 [00:57<00:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9422, LAS: 0.8905, UEM: 0.5936, LEM: 0.3463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9196, partial_loss/deprel_loss: 0.8773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0618, loss: 0.7851, batch_reg_loss: 0.1761, reg_loss: 0.1756 ||: 89%|########9 | 85/95 [00:59<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9415, LAS: 0.8897, UEM: 0.5866, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1732, partial_loss/deprel_loss: 0.8958, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1274, loss: 0.7916, batch_reg_loss: 0.1762, reg_loss: 0.1756 ||: 94%|#########3| 89/95 [01:02<00:04, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9405, LAS: 0.8886, UEM: 0.5778, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2289, partial_loss/deprel_loss: 0.8653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1143, loss: 0.8000, batch_reg_loss: 0.1762, reg_loss: 0.1756 ||: 98%|#########7| 93/95 [01:04<00:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9269, UAS: 0.9406, LAS: 0.8886, UEM: 0.5797, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.3714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.7998, batch_reg_loss: 0.1763, reg_loss: 0.1756 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 00:09:27,115 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9153, LAS: 0.8558, UEM: 0.1908, LEM: 0.0526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4304, partial_loss/deprel_loss: 56.5432, partial_loss/cycle_loss: 0.0000, batch_loss: 45.5206, loss: 42.2261, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:10, 1.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9318, LAS: 0.8726, UEM: 0.3708, LEM: 0.0868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4709, partial_loss/deprel_loss: 23.6317, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9995, loss: 33.1798, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.08s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9432, LAS: 0.8868, UEM: 0.5980, LEM: 0.2941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 22.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1358, loss: 29.0568, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.08s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9457, LAS: 0.8899, UEM: 0.6081, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4233, partial_loss/deprel_loss: 28.9285, partial_loss/cycle_loss: 0.0000, batch_loss: 23.2275, loss: 27.2084, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9483, LAS: 0.8943, UEM: 0.6744, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2251, partial_loss/deprel_loss: 19.1517, partial_loss/cycle_loss: 0.0000, batch_loss: 15.3664, loss: 26.1318, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.06it/s]\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - reg_loss | 0.176 | 0.000\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - UEM | 0.580 | 0.674\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - LEM | 0.337 | 0.392\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EM | 0.927 | 0.938\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.190 | 0.225\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | 0.948\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB 
| 6955.898 | N/A\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.371 | 19.152\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - loss | 0.800 | 26.132\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - LAS | 0.889 | 0.894\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:37,461 - INFO - combo.training.trainer - Epoch duration: 0:01:16.963087\n", + "2023-04-07 00:09:37,461 - INFO - combo.training.trainer - Estimated training time remaining: 6:10:48\n", + "2023-04-07 00:09:37,461 - INFO - allennlp.training.trainer - Epoch 71/399\n", + "2023-04-07 00:09:37,461 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:09:37,462 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:09:37,469 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9552, LAS: 0.9068, UEM: 0.6813, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1733, partial_loss/deprel_loss: 0.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4515, loss: 0.6592, batch_reg_loss: 
0.1763, reg_loss: 0.1763 ||: 4%|4 | 4/95 [00:02<00:54, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9475, LAS: 0.8981, UEM: 0.5787, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4932, partial_loss/deprel_loss: 0.6592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8024, loss: 0.7276, batch_reg_loss: 0.1764, reg_loss: 0.1763 ||: 8%|8 | 8/95 [00:04<00:50, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9581, UAS: 0.9502, LAS: 0.9021, UEM: 0.6920, LEM: 0.4880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0532, partial_loss/deprel_loss: 0.1633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3177, loss: 0.6972, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 12%|#1 | 11/95 [00:06<00:53, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8585, UAS: 0.9455, LAS: 0.8973, UEM: 0.6476, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9427, partial_loss/deprel_loss: 0.8309, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0298, loss: 0.7332, batch_reg_loss: 0.1765, reg_loss: 0.1764 ||: 16%|#5 | 15/95 [00:09<00:48, 1.64it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9403, LAS: 0.8910, UEM: 0.5839, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6263, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9107, loss: 0.7906, batch_reg_loss: 0.1766, reg_loss: 0.1764 ||: 21%|##1 | 20/95 [00:11<00:41, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, 
UAS: 0.9412, LAS: 0.8917, UEM: 0.5907, LEM: 0.3735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2732, partial_loss/deprel_loss: 0.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.7859, batch_reg_loss: 0.1767, reg_loss: 0.1765 ||: 26%|##6 | 25/95 [00:13<00:38, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9380, LAS: 0.8878, UEM: 0.5626, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5694, partial_loss/deprel_loss: 0.6708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.8117, batch_reg_loss: 0.1767, reg_loss: 0.1765 ||: 31%|### | 29/95 [00:16<00:38, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9386, LAS: 0.8881, UEM: 0.5534, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8262, loss: 0.8095, batch_reg_loss: 0.1768, reg_loss: 0.1765 ||: 35%|###4 | 33/95 [00:19<00:37, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9387, LAS: 0.8882, UEM: 0.5429, LEM: 0.3209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7026, partial_loss/deprel_loss: 0.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8647, loss: 0.8090, batch_reg_loss: 0.1768, reg_loss: 0.1766 ||: 39%|###8 | 37/95 [00:22<00:37, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8166, UAS: 0.9378, LAS: 0.8871, UEM: 0.5435, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5673, partial_loss/deprel_loss: 1.0897, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3621, loss: 0.8157, 
batch_reg_loss: 0.1769, reg_loss: 0.1766 ||: 43%|####3 | 41/95 [00:25<00:36, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9387, LAS: 0.8877, UEM: 0.5407, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.5889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7463, loss: 0.8124, batch_reg_loss: 0.1770, reg_loss: 0.1766 ||: 46%|####6 | 44/95 [00:27<00:34, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8346, UAS: 0.9389, LAS: 0.8879, UEM: 0.5550, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3078, partial_loss/deprel_loss: 0.9468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1960, loss: 0.8088, batch_reg_loss: 0.1770, reg_loss: 0.1766 ||: 49%|####9 | 47/95 [00:29<00:32, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9387, LAS: 0.8879, UEM: 0.5572, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0041, partial_loss/deprel_loss: 0.8890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0890, loss: 0.8090, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||: 53%|#####2 | 50/95 [00:31<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9385, LAS: 0.8875, UEM: 0.5519, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1688, partial_loss/deprel_loss: 0.9223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1487, loss: 0.8117, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||: 56%|#####5 | 53/95 [00:33<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9386, LAS: 0.8874, UEM: 
0.5469, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.8119, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||: 59%|#####8 | 56/95 [00:35<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9388, LAS: 0.8876, UEM: 0.5448, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3204, partial_loss/deprel_loss: 0.4900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.8105, batch_reg_loss: 0.1772, reg_loss: 0.1767 ||: 62%|######2 | 59/95 [00:37<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9393, LAS: 0.8880, UEM: 0.5485, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4376, partial_loss/deprel_loss: 0.6354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7731, loss: 0.8058, batch_reg_loss: 0.1772, reg_loss: 0.1768 ||: 65%|######5 | 62/95 [00:40<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9400, LAS: 0.8888, UEM: 0.5493, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3143, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.8020, batch_reg_loss: 0.1773, reg_loss: 0.1768 ||: 69%|######9 | 66/95 [00:42<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9409, LAS: 0.8897, UEM: 0.5563, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.4179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5579, loss: 0.7938, batch_reg_loss: 
0.1774, reg_loss: 0.1768 ||: 74%|#######3 | 70/95 [00:45<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9395, LAS: 0.8883, UEM: 0.5604, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.3368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4770, loss: 0.8039, batch_reg_loss: 0.1774, reg_loss: 0.1768 ||: 77%|#######6 | 73/95 [00:47<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9400, LAS: 0.8889, UEM: 0.5613, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5803, loss: 0.8009, batch_reg_loss: 0.1774, reg_loss: 0.1769 ||: 80%|######## | 76/95 [00:49<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9402, LAS: 0.8893, UEM: 0.5742, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1263, partial_loss/deprel_loss: 0.2588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4097, loss: 0.7961, batch_reg_loss: 0.1775, reg_loss: 0.1769 ||: 83%|########3 | 79/95 [00:51<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9397, LAS: 0.8887, UEM: 0.5725, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.8023, batch_reg_loss: 0.1775, reg_loss: 0.1769 ||: 87%|########7 | 83/95 [00:54<00:08, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9400, LAS: 0.8889, UEM: 0.5712, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3889, partial_loss/deprel_loss: 0.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8005, batch_reg_loss: 0.1776, reg_loss: 0.1769 ||: 91%|######### | 86/95 [00:56<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9400, LAS: 0.8890, UEM: 0.5667, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.5279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.7999, batch_reg_loss: 0.1776, reg_loss: 0.1770 ||: 94%|#########3| 89/95 [00:58<00:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9403, LAS: 0.8892, UEM: 0.5763, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2965, partial_loss/deprel_loss: 0.9069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1625, loss: 0.7979, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||: 97%|#########6| 92/95 [01:01<00:02, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9412, LAS: 0.8901, UEM: 0.5836, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2061, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.7915, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||: 100%|##########| 95/95 [01:03<00:00, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9412, LAS: 0.8901, UEM: 0.5836, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2061, partial_loss/deprel_loss: 0.4362, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.7915, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - reg_loss | 0.177 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - LEM | 0.337 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EM | 0.918 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.206 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.436 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - loss | 0.792 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 
00:10:41,102 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:10:41,103 - INFO - combo.training.trainer - Epoch duration: 0:01:03.641837\n", + "2023-04-07 00:10:41,103 - INFO - combo.training.trainer - Estimated training time remaining: 6:09:22\n", + "2023-04-07 00:10:41,103 - INFO - allennlp.training.trainer - Epoch 72/399\n", + "2023-04-07 00:10:41,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:10:41,104 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:10:41,111 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9448, LAS: 0.8959, UEM: 0.6095, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2510, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5284, loss: 0.7326, batch_reg_loss: 0.1778, reg_loss: 0.1777 ||: 4%|4 | 4/95 [00:02<00:59, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9388, LAS: 0.8880, UEM: 0.5319, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0482, partial_loss/deprel_loss: 0.8046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0311, loss: 0.8022, batch_reg_loss: 0.1778, reg_loss: 0.1778 ||: 7%|7 | 7/95 [00:04<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9419, LAS: 0.8927, UEM: 0.5798, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7500, partial_loss/deprel_loss: 0.7594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9353, loss: 0.7699, batch_reg_loss: 0.1778, reg_loss: 0.1778 ||: 11%|# | 10/95 [00:06<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9388, LAS: 0.8894, UEM: 0.5484, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6365, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8131, loss: 0.7911, batch_reg_loss: 0.1779, reg_loss: 0.1778 ||: 14%|#3 | 13/95 [00:08<00:55, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9358, LAS: 0.8860, UEM: 0.4914, LEM: 0.2684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7931, loss: 0.8190, batch_reg_loss: 0.1779, reg_loss: 0.1778 ||: 18%|#7 | 17/95 [00:11<00:51, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9401, LAS: 0.8908, UEM: 0.5316, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.4793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6397, loss: 0.7893, batch_reg_loss: 0.1780, reg_loss: 0.1778 ||: 21%|##1 | 20/95 [00:13<00:50, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9426, LAS: 0.8931, UEM: 0.5414, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.5793, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7344, loss: 0.7734, batch_reg_loss: 0.1780, reg_loss: 0.1779 ||: 25%|##5 | 24/95 [00:16<00:47, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9434, LAS: 0.8941, UEM: 0.5586, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4896, loss: 0.7642, batch_reg_loss: 0.1781, reg_loss: 0.1779 ||: 29%|##9 | 28/95 [00:18<00:44, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9452, LAS: 0.8960, UEM: 0.5764, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3343, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6497, loss: 0.7491, batch_reg_loss: 0.1781, reg_loss: 0.1779 ||: 33%|###2 | 31/95 [00:21<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9472, LAS: 0.8988, UEM: 0.6355, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1090, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.7275, batch_reg_loss: 0.1782, reg_loss: 0.1780 ||: 36%|###5 | 34/95 [00:23<00:46, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9472, LAS: 0.8983, UEM: 0.6318, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4965, loss: 0.7297, batch_reg_loss: 0.1782, reg_loss: 0.1780 ||: 40%|#### | 38/95 [00:26<00:41, 1.36it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9472, LAS: 0.8981, UEM: 0.6233, LEM: 0.3842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5991, partial_loss/deprel_loss: 0.7210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8749, loss: 0.7319, batch_reg_loss: 0.1783, reg_loss: 0.1780 ||: 45%|####5 | 43/95 [00:28<00:33, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9457, LAS: 0.8964, UEM: 0.6122, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8049, loss: 0.7461, batch_reg_loss: 0.1783, reg_loss: 0.1780 ||: 49%|####9 | 47/95 [00:30<00:28, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8240, UAS: 0.9435, LAS: 0.8936, UEM: 0.6103, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4303, partial_loss/deprel_loss: 1.0489, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3035, loss: 0.7667, batch_reg_loss: 0.1783, reg_loss: 0.1781 ||: 55%|#####4 | 52/95 [00:33<00:24, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9451, LAS: 0.8952, UEM: 0.6205, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.5809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.7555, batch_reg_loss: 0.1784, reg_loss: 0.1781 ||: 60%|###### | 57/95 [00:35<00:20, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9441, LAS: 0.8940, UEM: 0.6165, LEM: 0.3692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3280, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.7638, batch_reg_loss: 0.1785, reg_loss: 0.1781 ||: 64%|######4 | 61/95 [00:38<00:18, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9427, LAS: 0.8925, UEM: 0.6059, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8219, partial_loss/deprel_loss: 0.7629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9532, loss: 0.7773, batch_reg_loss: 0.1785, reg_loss: 0.1781 ||: 68%|######8 | 65/95 [00:40<00:17, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9424, LAS: 0.8920, UEM: 0.6026, LEM: 0.3569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4567, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7550, loss: 0.7816, batch_reg_loss: 0.1786, reg_loss: 0.1782 ||: 73%|#######2 | 69/95 [00:43<00:15, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9406, LAS: 0.8899, UEM: 0.5935, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3250, partial_loss/deprel_loss: 0.4898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6355, loss: 0.7957, batch_reg_loss: 0.1787, reg_loss: 0.1782 ||: 77%|#######6 | 73/95 [00:45<00:13, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9418, LAS: 0.8913, UEM: 0.6129, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3080, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.7826, batch_reg_loss: 0.1787, reg_loss: 0.1782 ||: 81%|########1 | 77/95 [00:49<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9415, LAS: 0.8906, UEM: 0.6072, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7716, partial_loss/deprel_loss: 0.8624, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0230, loss: 0.7860, batch_reg_loss: 0.1788, reg_loss: 0.1782 ||: 85%|########5 | 81/95 [00:51<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9410, LAS: 0.8898, UEM: 0.5993, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.6528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.7914, batch_reg_loss: 0.1789, reg_loss: 0.1783 ||: 89%|########9 | 85/95 [00:54<00:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9406, LAS: 0.8895, UEM: 0.5951, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0214, partial_loss/deprel_loss: 0.9291, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1265, loss: 0.7949, batch_reg_loss: 0.1789, reg_loss: 0.1783 ||: 94%|#########3| 89/95 [00:57<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9398, LAS: 0.8886, UEM: 0.5865, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 0.6854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8863, loss: 0.8020, batch_reg_loss: 0.1790, reg_loss: 0.1783 ||: 98%|#########7| 93/95 [00:59<00:01, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9399, LAS: 0.8888, UEM: 0.5849, LEM: 0.3435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4183, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6715, loss: 0.8009, batch_reg_loss: 0.1790, reg_loss: 0.1783 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - reg_loss | 0.178 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UEM | 0.585 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - LEM | 0.343 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EM | 0.909 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.418 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.511 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - LAS | 0.889 | N/A\n", + "2023-04-07 
00:11:42,408 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:42,409 - INFO - combo.training.trainer - Epoch duration: 0:01:01.305670\n", + "2023-04-07 00:11:42,409 - INFO - combo.training.trainer - Estimated training time remaining: 6:07:46\n", + "2023-04-07 00:11:42,409 - INFO - allennlp.training.trainer - Epoch 73/399\n", + "2023-04-07 00:11:42,409 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:11:42,410 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:11:42,416 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9595, LAS: 0.9081, UEM: 0.6650, LEM: 0.3547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3901, partial_loss/deprel_loss: 0.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6354, loss: 0.6435, batch_reg_loss: 0.1791, reg_loss: 0.1790 ||: 3%|3 | 3/95 [00:02<01:14, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9484, LAS: 0.8968, UEM: 0.5682, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0665, partial_loss/deprel_loss: 0.8109, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0411, loss: 0.7307, batch_reg_loss: 0.1791, reg_loss: 0.1791 
||: 6%|6 | 6/95 [00:04<01:09, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9421, LAS: 0.8909, UEM: 0.5965, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2777, partial_loss/deprel_loss: 0.9002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1549, loss: 0.7789, batch_reg_loss: 0.1791, reg_loss: 0.1791 ||: 9%|9 | 9/95 [00:06<01:07, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9485, LAS: 0.8981, UEM: 0.6525, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3354, partial_loss/deprel_loss: 0.4767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6276, loss: 0.7280, batch_reg_loss: 0.1792, reg_loss: 0.1791 ||: 13%|#2 | 12/95 [00:08<01:02, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9463, LAS: 0.8966, UEM: 0.6072, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0163, partial_loss/deprel_loss: 0.8169, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.7424, batch_reg_loss: 0.1792, reg_loss: 0.1791 ||: 17%|#6 | 16/95 [00:11<00:55, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9420, LAS: 0.8917, UEM: 0.6009, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.4819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.7828, batch_reg_loss: 0.1793, reg_loss: 0.1792 ||: 20%|## | 19/95 [00:13<00:53, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9395, LAS: 0.8894, UEM: 0.5673, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.7418, partial_loss/deprel_loss: 0.6360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8364, loss: 0.7981, batch_reg_loss: 0.1793, reg_loss: 0.1792 ||: 23%|##3 | 22/95 [00:15<00:51, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9423, LAS: 0.8924, UEM: 0.5907, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.4751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6177, loss: 0.7735, batch_reg_loss: 0.1794, reg_loss: 0.1792 ||: 26%|##6 | 25/95 [00:17<00:51, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9420, LAS: 0.8923, UEM: 0.5727, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9474, partial_loss/deprel_loss: 0.7746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9886, loss: 0.7773, batch_reg_loss: 0.1794, reg_loss: 0.1792 ||: 29%|##9 | 28/95 [00:20<00:48, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9428, LAS: 0.8931, UEM: 0.5892, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.7717, batch_reg_loss: 0.1795, reg_loss: 0.1792 ||: 33%|###2 | 31/95 [00:22<00:46, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9407, LAS: 0.8906, UEM: 0.5706, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.5962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.7909, batch_reg_loss: 0.1795, reg_loss: 0.1793 ||: 37%|###6 | 35/95 [00:24<00:40, 1.47it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9390, LAS: 0.8885, UEM: 0.5531, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6376, partial_loss/deprel_loss: 0.7715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9243, loss: 0.8063, batch_reg_loss: 0.1796, reg_loss: 0.1793 ||: 40%|#### | 38/95 [00:26<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9380, LAS: 0.8873, UEM: 0.5584, LEM: 0.3126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4264, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7118, loss: 0.8124, batch_reg_loss: 0.1796, reg_loss: 0.1793 ||: 43%|####3 | 41/95 [00:29<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9383, LAS: 0.8877, UEM: 0.5571, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2281, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5802, loss: 0.8078, batch_reg_loss: 0.1797, reg_loss: 0.1793 ||: 47%|####7 | 45/95 [00:31<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9362, LAS: 0.8857, UEM: 0.5522, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1931, partial_loss/deprel_loss: 0.8665, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8223, batch_reg_loss: 0.1797, reg_loss: 0.1794 ||: 51%|##### | 48/95 [00:33<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9368, LAS: 0.8861, UEM: 0.5426, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5555, partial_loss/deprel_loss: 0.6462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 0.8225, batch_reg_loss: 0.1798, reg_loss: 0.1794 ||: 55%|#####4 | 52/95 [00:36<00:29, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9379, LAS: 0.8875, UEM: 0.5514, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2471, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.8107, batch_reg_loss: 0.1799, reg_loss: 0.1794 ||: 59%|#####8 | 56/95 [00:38<00:25, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9389, LAS: 0.8886, UEM: 0.5519, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6545, partial_loss/deprel_loss: 0.6234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8095, loss: 0.8024, batch_reg_loss: 0.1799, reg_loss: 0.1795 ||: 63%|######3 | 60/95 [00:41<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9393, LAS: 0.8887, UEM: 0.5533, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 0.8101, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0233, loss: 0.8015, batch_reg_loss: 0.1800, reg_loss: 0.1795 ||: 67%|######7 | 64/95 [00:44<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9405, LAS: 0.8903, UEM: 0.5824, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0535, partial_loss/deprel_loss: 0.1670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3243, loss: 0.7917, batch_reg_loss: 0.1800, 
reg_loss: 0.1795 ||: 71%|####### | 67/95 [00:46<00:20, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9412, LAS: 0.8909, UEM: 0.5884, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3541, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.7866, batch_reg_loss: 0.1801, reg_loss: 0.1795 ||: 74%|#######3 | 70/95 [00:49<00:18, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9411, LAS: 0.8908, UEM: 0.5868, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3168, partial_loss/deprel_loss: 0.5028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.7875, batch_reg_loss: 0.1801, reg_loss: 0.1796 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9412, LAS: 0.8907, UEM: 0.5859, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4250, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1944, loss: 0.7883, batch_reg_loss: 0.1801, reg_loss: 0.1796 ||: 83%|########3 | 79/95 [00:53<00:10, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9408, LAS: 0.8901, UEM: 0.5766, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4056, partial_loss/deprel_loss: 0.5294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6848, loss: 0.7940, batch_reg_loss: 0.1802, reg_loss: 0.1796 ||: 88%|########8 | 84/95 [00:55<00:06, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9403, LAS: 0.8895, UEM: 0.5670, LEM: 
0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6572, partial_loss/deprel_loss: 0.7248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8915, loss: 0.7981, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||: 94%|#########3| 89/95 [00:57<00:03, 1.92it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9404, LAS: 0.8896, UEM: 0.5810, LEM: 0.3396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9609, partial_loss/deprel_loss: 0.8782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0751, loss: 0.7993, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||: 99%|#########8| 94/95 [01:01<00:00, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9407, LAS: 0.8899, UEM: 0.5840, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2879, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.7969, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - reg_loss | 0.180 | N/A\n", + "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LEM | 0.342 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - EM | 0.920 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.288 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.420 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - loss | 0.797 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:12:44,470 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:44,470 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:44,470 - INFO - combo.training.trainer - Epoch duration: 0:01:02.061214\n", + "2023-04-07 00:12:44,470 - INFO - combo.training.trainer - Estimated training time remaining: 6:06:15\n", + "2023-04-07 00:12:44,470 - INFO - allennlp.training.trainer - Epoch 74/399\n", + "2023-04-07 00:12:44,471 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:12:44,471 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:12:44,478 
- INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9161, LAS: 0.8671, UEM: 0.3030, LEM: 0.1145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3191, partial_loss/deprel_loss: 0.8518, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1257, loss: 0.9598, batch_reg_loss: 0.1804, reg_loss: 0.1804 ||: 3%|3 | 3/95 [00:02<01:02, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9306, LAS: 0.8803, UEM: 0.4575, LEM: 0.2172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.4430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5899, loss: 0.8639, batch_reg_loss: 0.1804, reg_loss: 0.1804 ||: 7%|7 | 7/95 [00:04<01:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9281, LAS: 0.8758, UEM: 0.4062, LEM: 0.1898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1880, partial_loss/deprel_loss: 0.8916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1314, loss: 0.9038, batch_reg_loss: 0.1805, reg_loss: 0.1804 ||: 12%|#1 | 11/95 [00:07<00:55, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9358, LAS: 0.8859, UEM: 0.5790, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0826, partial_loss/deprel_loss: 0.1733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.8216, batch_reg_loss: 0.1806, reg_loss: 0.1805 ||: 16%|#5 | 15/95 [00:10<00:55, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8652, UAS: 0.9374, LAS: 0.8873, UEM: 0.5968, LEM: 0.3911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8965, partial_loss/deprel_loss: 0.7724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9778, loss: 0.8044, batch_reg_loss: 0.1806, reg_loss: 0.1805 ||: 19%|#8 | 18/95 [00:12<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9352, LAS: 0.8850, UEM: 0.5647, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6314, partial_loss/deprel_loss: 0.6904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8593, loss: 0.8253, batch_reg_loss: 0.1807, reg_loss: 0.1805 ||: 22%|##2 | 21/95 [00:14<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9381, LAS: 0.8877, UEM: 0.5643, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6442, partial_loss/deprel_loss: 0.7299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.8088, batch_reg_loss: 0.1807, reg_loss: 0.1805 ||: 26%|##6 | 25/95 [00:17<00:48, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9391, LAS: 0.8887, UEM: 0.5723, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.8021, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||: 29%|##9 | 28/95 [00:19<00:47, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9377, LAS: 0.8867, UEM: 0.5533, LEM: 0.3328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5782, partial_loss/deprel_loss: 0.7032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8590, loss: 
0.8184, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||: 33%|###2 | 31/95 [00:21<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9377, LAS: 0.8864, UEM: 0.5491, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3226, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6222, loss: 0.8197, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||: 36%|###5 | 34/95 [00:23<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8779, UAS: 0.9379, LAS: 0.8863, UEM: 0.5474, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6239, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 0.8200, batch_reg_loss: 0.1809, reg_loss: 0.1806 ||: 39%|###8 | 37/95 [00:25<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9380, LAS: 0.8861, UEM: 0.5464, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 0.4376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.8221, batch_reg_loss: 0.1809, reg_loss: 0.1806 ||: 42%|####2 | 40/95 [00:28<00:40, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9390, LAS: 0.8873, UEM: 0.5618, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5021, partial_loss/deprel_loss: 0.5595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7290, loss: 0.8097, batch_reg_loss: 0.1810, reg_loss: 0.1807 ||: 45%|####5 | 43/95 [00:30<00:37, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9395, LAS: 0.8878, UEM: 
0.5577, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6855, loss: 0.8060, batch_reg_loss: 0.1810, reg_loss: 0.1807 ||: 48%|####8 | 46/95 [00:32<00:35, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9396, LAS: 0.8876, UEM: 0.5527, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7582, partial_loss/deprel_loss: 0.7119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9023, loss: 0.8061, batch_reg_loss: 0.1811, reg_loss: 0.1807 ||: 52%|#####1 | 49/95 [00:34<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9400, LAS: 0.8881, UEM: 0.5570, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1542, partial_loss/deprel_loss: 0.9661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1848, loss: 0.8046, batch_reg_loss: 0.1811, reg_loss: 0.1807 ||: 55%|#####4 | 52/95 [00:37<00:31, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9407, LAS: 0.8887, UEM: 0.5609, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2055, partial_loss/deprel_loss: 0.4421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.8005, batch_reg_loss: 0.1811, reg_loss: 0.1808 ||: 58%|#####7 | 55/95 [00:39<00:28, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9409, LAS: 0.8892, UEM: 0.5680, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5210, partial_loss/deprel_loss: 0.6415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 0.7969, batch_reg_loss: 
0.1812, reg_loss: 0.1808 ||: 61%|######1 | 58/95 [00:41<00:26, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9396, LAS: 0.8878, UEM: 0.5615, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5982, partial_loss/deprel_loss: 0.6778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8431, loss: 0.8095, batch_reg_loss: 0.1812, reg_loss: 0.1808 ||: 64%|######4 | 61/95 [00:43<00:24, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9401, LAS: 0.8883, UEM: 0.5663, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1634, partial_loss/deprel_loss: 0.3427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.8067, batch_reg_loss: 0.1812, reg_loss: 0.1808 ||: 67%|######7 | 64/95 [00:45<00:22, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9403, LAS: 0.8884, UEM: 0.5733, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5623, partial_loss/deprel_loss: 0.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8385, loss: 0.8059, batch_reg_loss: 0.1813, reg_loss: 0.1808 ||: 71%|####### | 67/95 [00:47<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9399, LAS: 0.8881, UEM: 0.5782, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2383, partial_loss/deprel_loss: 0.4386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.8079, batch_reg_loss: 0.1813, reg_loss: 0.1809 ||: 74%|#######3 | 70/95 [00:49<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9409, LAS: 0.8893, UEM: 0.5934, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.7988, batch_reg_loss: 0.1814, reg_loss: 0.1809 ||: 77%|#######6 | 73/95 [00:51<00:15, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8297, UAS: 0.9406, LAS: 0.8888, UEM: 0.5909, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3382, partial_loss/deprel_loss: 0.9632, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2196, loss: 0.8014, batch_reg_loss: 0.1814, reg_loss: 0.1809 ||: 81%|########1 | 77/95 [00:54<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9407, LAS: 0.8889, UEM: 0.5936, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.5269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7998, batch_reg_loss: 0.1815, reg_loss: 0.1809 ||: 84%|########4 | 80/95 [00:56<00:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9410, LAS: 0.8892, UEM: 0.5885, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4599, partial_loss/deprel_loss: 0.5396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.7969, batch_reg_loss: 0.1815, reg_loss: 0.1810 ||: 88%|########8 | 84/95 [00:59<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9411, LAS: 0.8891, UEM: 0.5851, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9966, partial_loss/deprel_loss: 0.9497, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.1407, loss: 0.7987, batch_reg_loss: 0.1816, reg_loss: 0.1810 ||: 93%|#########2| 88/95 [01:02<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9414, LAS: 0.8894, UEM: 0.5865, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2723, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5572, loss: 0.7953, batch_reg_loss: 0.1816, reg_loss: 0.1810 ||: 96%|#########5| 91/95 [01:04<00:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9406, LAS: 0.8885, UEM: 0.5807, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.8012, batch_reg_loss: 0.1817, reg_loss: 0.1810 ||: 100%|##########| 95/95 [01:06<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9406, LAS: 0.8885, UEM: 0.5807, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.8012, batch_reg_loss: 0.1817, reg_loss: 0.1810 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-07 00:13:51,409 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - reg_loss | 0.181 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 
00:13:51,410 - INFO - combo.training.tensorboard_writer - UEM | 0.581 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - LEM | 0.337 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EM | 0.910 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.328 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.495 | N/A\n", + "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - LAS | 0.889 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:13:51,412 - INFO - combo.training.trainer - Epoch duration: 0:01:06.941094\n", + "2023-04-07 00:13:51,412 - INFO - combo.training.trainer - Estimated training time remaining: 
6:05:05\n", + "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - Epoch 75/399\n", + "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:13:51,419 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9098, LAS: 0.8622, UEM: 0.0877, LEM: 0.0132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1153, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0131, loss: 0.9803, batch_reg_loss: 0.1817, reg_loss: 0.1817 ||: 3%|3 | 3/95 [00:02<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9272, LAS: 0.8776, UEM: 0.3059, LEM: 0.1173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6280, partial_loss/deprel_loss: 0.6272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8091, loss: 0.8778, batch_reg_loss: 0.1817, reg_loss: 0.1817 ||: 6%|6 | 6/95 [00:04<01:01, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9345, LAS: 0.8839, UEM: 0.3528, LEM: 0.1280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4540, partial_loss/deprel_loss: 0.5823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7384, loss: 0.8420, batch_reg_loss: 0.1818, reg_loss: 0.1817 ||: 11%|# | 10/95 [00:06<00:55, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9377, LAS: 0.8877, UEM: 0.4580, LEM: 0.2246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2667, partial_loss/deprel_loss: 0.5394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6667, loss: 0.8077, batch_reg_loss: 0.1819, reg_loss: 0.1818 ||: 16%|#5 | 15/95 [00:08<00:47, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9347, LAS: 0.8835, UEM: 0.4359, LEM: 0.2086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4911, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8011, loss: 0.8421, batch_reg_loss: 0.1819, reg_loss: 0.1818 ||: 21%|##1 | 20/95 [00:11<00:41, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9372, LAS: 0.8859, UEM: 0.4520, LEM: 0.2106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7598, partial_loss/deprel_loss: 0.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8985, loss: 0.8208, batch_reg_loss: 0.1820, reg_loss: 0.1818 ||: 26%|##6 | 25/95 [00:13<00:35, 1.95it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9382, LAS: 0.8873, UEM: 0.5193, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5604, loss: 0.8099, batch_reg_loss: 0.1821, reg_loss: 0.1819 ||: 32%|###1 | 30/95 [00:15<00:32, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9392, LAS: 0.8884, UEM: 0.5258, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.5791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.8038, batch_reg_loss: 0.1822, reg_loss: 0.1819 ||: 36%|###5 | 34/95 [00:17<00:31, 1.94it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9396, LAS: 0.8886, UEM: 0.5388, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1500, partial_loss/deprel_loss: 0.8686, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1071, loss: 0.8017, batch_reg_loss: 0.1822, reg_loss: 0.1819 ||: 40%|#### | 38/95 [00:20<00:34, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9409, LAS: 0.8901, UEM: 0.5459, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8091, loss: 0.7930, batch_reg_loss: 0.1823, reg_loss: 0.1820 ||: 44%|####4 | 42/95 [00:23<00:33, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8711, UAS: 0.9402, LAS: 0.8892, UEM: 0.5421, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6804, partial_loss/deprel_loss: 0.7860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9472, loss: 0.7997, batch_reg_loss: 0.1823, reg_loss: 0.1820 ||: 48%|####8 | 46/95 [00:26<00:32, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9410, LAS: 0.8900, UEM: 0.5659, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.4134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.7930, batch_reg_loss: 0.1824, reg_loss: 0.1820 ||: 53%|#####2 | 50/95 [00:29<00:30, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7834, UAS: 0.9403, LAS: 0.8895, UEM: 0.5902, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0890, 
partial_loss/deprel_loss: 1.1278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5024, loss: 0.7955, batch_reg_loss: 0.1824, reg_loss: 0.1821 ||: 57%|#####6 | 54/95 [00:32<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9410, LAS: 0.8903, UEM: 0.5907, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.5865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7904, batch_reg_loss: 0.1825, reg_loss: 0.1821 ||: 60%|###### | 57/95 [00:35<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9407, LAS: 0.8899, UEM: 0.5785, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3906, partial_loss/deprel_loss: 0.5374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7937, batch_reg_loss: 0.1825, reg_loss: 0.1821 ||: 64%|######4 | 61/95 [00:37<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9415, LAS: 0.8906, UEM: 0.5929, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4893, loss: 0.7883, batch_reg_loss: 0.1826, reg_loss: 0.1821 ||: 67%|######7 | 64/95 [00:39<00:22, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9421, LAS: 0.8914, UEM: 0.6002, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2630, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5620, loss: 0.7812, batch_reg_loss: 0.1826, reg_loss: 0.1821 ||: 71%|####### | 67/95 [00:42<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9420, LAS: 0.8914, UEM: 0.5963, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3357, partial_loss/deprel_loss: 0.8577, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.7819, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||: 75%|#######4 | 71/95 [00:44<00:16, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9426, LAS: 0.8922, UEM: 0.6031, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2671, partial_loss/deprel_loss: 0.3893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5476, loss: 0.7760, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||: 78%|#######7 | 74/95 [00:47<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9417, LAS: 0.8911, UEM: 0.5919, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9803, partial_loss/deprel_loss: 0.8861, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0877, loss: 0.7840, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||: 82%|########2 | 78/95 [00:49<00:11, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9425, LAS: 0.8920, UEM: 0.5974, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3638, partial_loss/deprel_loss: 0.4613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6246, loss: 0.7768, batch_reg_loss: 0.1828, reg_loss: 0.1822 ||: 85%|########5 | 81/95 [00:51<00:10, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8313, UAS: 0.9422, LAS: 0.8917, UEM: 0.5951, LEM: 0.3479, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4579, partial_loss/deprel_loss: 0.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2073, loss: 0.7794, batch_reg_loss: 0.1828, reg_loss: 0.1823 ||: 88%|########8 | 84/95 [00:54<00:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9420, LAS: 0.8915, UEM: 0.5913, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7022, partial_loss/deprel_loss: 0.7376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9134, loss: 0.7813, batch_reg_loss: 0.1828, reg_loss: 0.1823 ||: 92%|#########1| 87/95 [00:56<00:05, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9407, LAS: 0.8900, UEM: 0.5821, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0682, partial_loss/deprel_loss: 0.8623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0864, loss: 0.7937, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||: 96%|#########5| 91/95 [00:58<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9406, LAS: 0.8899, UEM: 0.5845, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1381, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.7951, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||: 100%|##########| 95/95 [01:01<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9406, LAS: 0.8899, UEM: 0.5845, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1381, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.7951, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||: 
100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 00:14:53,028 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9663, LAS: 0.9206, UEM: 0.8083, LEM: 0.5614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4550, partial_loss/deprel_loss: 28.7498, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0908, loss: 20.1704, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9597, LAS: 0.9119, UEM: 0.7813, LEM: 0.5211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2073, partial_loss/deprel_loss: 22.4669, partial_loss/cycle_loss: 0.0000, batch_loss: 18.0150, loss: 20.2816, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9470, LAS: 0.8946, UEM: 0.7130, LEM: 0.4618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0117, partial_loss/deprel_loss: 43.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 34.8180, loss: 25.7831, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.00s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9468, LAS: 0.8939, UEM: 0.6769, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 24.0904, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3541, loss: 26.5160, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9475, LAS: 0.8947, UEM: 0.6682, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 23.4807, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8884, loss: 25.8226, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02it/s]\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - reg_loss | 0.182 | 0.000\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | 0.668\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - LEM | 0.340 | 0.398\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EM | 0.922 | 0.902\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.138 | 0.519\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | 0.947\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.345 | 23.481\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - loss | 0.795 | 25.823\n", + "2023-04-07 00:15:03,819 - INFO - 
combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | 0.895\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:15:03,820 - INFO - combo.training.trainer - Epoch duration: 0:01:12.408039\n", + "2023-04-07 00:15:03,820 - INFO - combo.training.trainer - Estimated training time remaining: 6:04:19\n", + "2023-04-07 00:15:03,820 - INFO - allennlp.training.trainer - Epoch 76/399\n", + "2023-04-07 00:15:03,820 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:15:03,821 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:15:03,827 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9547, LAS: 0.9081, UEM: 0.5728, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.4644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.6572, batch_reg_loss: 0.1830, reg_loss: 0.1830 ||: 3%|3 | 3/95 [00:02<01:08, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9568, LAS: 0.9083, 
UEM: 0.6590, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1612, partial_loss/deprel_loss: 0.3406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6524, batch_reg_loss: 0.1831, reg_loss: 0.1830 ||: 7%|7 | 7/95 [00:04<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9493, LAS: 0.8998, UEM: 0.6395, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.5381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7173, loss: 0.7159, batch_reg_loss: 0.1831, reg_loss: 0.1830 ||: 11%|# | 10/95 [00:07<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9520, LAS: 0.9034, UEM: 0.6523, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3222, partial_loss/deprel_loss: 0.5445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.6955, batch_reg_loss: 0.1831, reg_loss: 0.1831 ||: 14%|#3 | 13/95 [00:09<00:59, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9500, LAS: 0.9006, UEM: 0.6224, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3848, partial_loss/deprel_loss: 0.5336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.7136, batch_reg_loss: 0.1832, reg_loss: 0.1831 ||: 17%|#6 | 16/95 [00:11<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9455, LAS: 0.8956, UEM: 0.5912, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9029, partial_loss/deprel_loss: 0.7841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9911, loss: 0.7523, batch_reg_loss: 0.1832, reg_loss: 
0.1831 ||: 21%|##1 | 20/95 [00:14<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9457, LAS: 0.8952, UEM: 0.5852, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7514, partial_loss/deprel_loss: 0.6884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8843, loss: 0.7547, batch_reg_loss: 0.1833, reg_loss: 0.1831 ||: 24%|##4 | 23/95 [00:16<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9466, LAS: 0.8961, UEM: 0.5951, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.6079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7427, batch_reg_loss: 0.1833, reg_loss: 0.1831 ||: 27%|##7 | 26/95 [00:18<00:48, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9473, LAS: 0.8969, UEM: 0.5933, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6708, partial_loss/deprel_loss: 0.6070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8031, loss: 0.7368, batch_reg_loss: 0.1833, reg_loss: 0.1832 ||: 31%|### | 29/95 [00:20<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9449, LAS: 0.8939, UEM: 0.5724, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5364, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 0.7615, batch_reg_loss: 0.1834, reg_loss: 0.1832 ||: 35%|###4 | 33/95 [00:22<00:39, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9462, LAS: 0.8961, UEM: 0.6060, LEM: 0.3546, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4429, partial_loss/deprel_loss: 0.5341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6993, loss: 0.7474, batch_reg_loss: 0.1834, reg_loss: 0.1832 ||: 39%|###8 | 37/95 [00:24<00:35, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9435, LAS: 0.8931, UEM: 0.5781, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7130, partial_loss/deprel_loss: 0.7432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9206, loss: 0.7751, batch_reg_loss: 0.1835, reg_loss: 0.1832 ||: 44%|####4 | 42/95 [00:26<00:30, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9434, LAS: 0.8932, UEM: 0.5714, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2446, partial_loss/deprel_loss: 0.4314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5776, loss: 0.7747, batch_reg_loss: 0.1836, reg_loss: 0.1833 ||: 49%|####9 | 47/95 [00:29<00:26, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9430, LAS: 0.8925, UEM: 0.5749, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2560, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5963, loss: 0.7768, batch_reg_loss: 0.1837, reg_loss: 0.1833 ||: 55%|#####4 | 52/95 [00:32<00:23, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9423, LAS: 0.8914, UEM: 0.5673, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3642, partial_loss/deprel_loss: 1.0457, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2931, loss: 0.7864, batch_reg_loss: 0.1837, reg_loss: 0.1833 ||: 59%|#####8 | 56/95 
[00:34<00:22, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9403, LAS: 0.8895, UEM: 0.5516, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8775, partial_loss/deprel_loss: 0.8152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0115, loss: 0.8033, batch_reg_loss: 0.1838, reg_loss: 0.1834 ||: 63%|######3 | 60/95 [00:37<00:21, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9389, LAS: 0.8881, UEM: 0.5582, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9317, partial_loss/deprel_loss: 0.8423, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0441, loss: 0.8129, batch_reg_loss: 0.1838, reg_loss: 0.1834 ||: 67%|######7 | 64/95 [00:40<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9395, LAS: 0.8886, UEM: 0.5596, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3226, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6661, loss: 0.8077, batch_reg_loss: 0.1839, reg_loss: 0.1834 ||: 72%|#######1 | 68/95 [00:43<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9394, LAS: 0.8886, UEM: 0.5535, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5394, partial_loss/deprel_loss: 0.6583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8185, loss: 0.8094, batch_reg_loss: 0.1840, reg_loss: 0.1834 ||: 76%|#######5 | 72/95 [00:45<00:15, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9399, LAS: 0.8891, UEM: 0.5571, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.8048, batch_reg_loss: 0.1840, reg_loss: 0.1835 ||: 79%|#######8 | 75/95 [00:48<00:13, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9399, LAS: 0.8891, UEM: 0.5653, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1215, partial_loss/deprel_loss: 0.3250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4684, loss: 0.8041, batch_reg_loss: 0.1841, reg_loss: 0.1835 ||: 82%|########2 | 78/95 [00:50<00:12, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9399, LAS: 0.8889, UEM: 0.5597, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6635, partial_loss/deprel_loss: 0.7208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8935, loss: 0.8050, batch_reg_loss: 0.1841, reg_loss: 0.1835 ||: 86%|########6 | 82/95 [00:52<00:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9406, LAS: 0.8896, UEM: 0.5637, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2760, partial_loss/deprel_loss: 0.4656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.8000, batch_reg_loss: 0.1842, reg_loss: 0.1835 ||: 89%|########9 | 85/95 [00:55<00:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9402, LAS: 0.8892, UEM: 0.5712, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5812, loss: 
0.8039, batch_reg_loss: 0.1842, reg_loss: 0.1836 ||: 93%|#########2| 88/95 [00:57<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9401, LAS: 0.8893, UEM: 0.5745, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3026, partial_loss/deprel_loss: 0.3780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5472, loss: 0.8029, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||: 96%|#########5| 91/95 [00:59<00:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9405, LAS: 0.8898, UEM: 0.5815, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1445, partial_loss/deprel_loss: 0.3091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.7986, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||: 99%|#########8| 94/95 [01:02<00:00, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9405, LAS: 0.8898, UEM: 0.5795, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5905, partial_loss/deprel_loss: 0.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7710, loss: 0.7983, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:16:06,583 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - reg_loss | 0.184 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - 
UEM | 0.580 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LEM | 0.338 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EM | 0.895 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.590 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.586 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - loss | 0.798 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:16:06,585 - INFO - combo.training.trainer - Epoch duration: 0:01:02.765135\n", + "2023-04-07 00:16:06,585 - INFO - combo.training.trainer - Estimated training time remaining: 6:02:52\n", + "2023-04-07 00:16:06,585 - INFO - 
allennlp.training.trainer - Epoch 77/399\n", + "2023-04-07 00:16:06,586 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:16:06,586 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:16:06,592 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9439, LAS: 0.8889, UEM: 0.4439, LEM: 0.1970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2992, partial_loss/deprel_loss: 0.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6209, loss: 0.8255, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||: 3%|3 | 3/95 [00:02<01:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9431, LAS: 0.8890, UEM: 0.4924, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8434, partial_loss/deprel_loss: 0.7793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9765, loss: 0.8081, batch_reg_loss: 0.1844, reg_loss: 0.1843 ||: 6%|6 | 6/95 [00:04<01:08, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9478, LAS: 0.8955, UEM: 0.5686, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5179, loss: 0.7473, batch_reg_loss: 0.1844, reg_loss: 0.1844 ||: 9%|9 | 9/95 [00:06<01:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9347, LAS: 0.8827, UEM: 0.4864, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7772, partial_loss/deprel_loss: 0.7062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9048, loss: 
0.8470, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||: 14%|#3 | 13/95 [00:09<00:58, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9397, LAS: 0.8877, UEM: 0.5467, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1979, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.8047, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||: 17%|#6 | 16/95 [00:11<01:00, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9374, LAS: 0.8854, UEM: 0.5454, LEM: 0.2955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4462, partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7495, loss: 0.8263, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||: 20%|## | 19/95 [00:14<00:58, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9405, LAS: 0.8888, UEM: 0.5523, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5662, partial_loss/deprel_loss: 0.6405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.8055, batch_reg_loss: 0.1846, reg_loss: 0.1845 ||: 24%|##4 | 23/95 [00:16<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9394, LAS: 0.8878, UEM: 0.5432, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.3998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.8084, batch_reg_loss: 0.1847, reg_loss: 0.1845 ||: 28%|##8 | 27/95 [00:19<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9340, LAS: 0.8821, UEM: 0.5129, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9194, partial_loss/deprel_loss: 0.8653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0609, loss: 0.8523, batch_reg_loss: 0.1847, reg_loss: 0.1845 ||: 33%|###2 | 31/95 [00:21<00:42, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9354, LAS: 0.8840, UEM: 0.5591, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.6119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7830, loss: 0.8391, batch_reg_loss: 0.1848, reg_loss: 0.1845 ||: 36%|###5 | 34/95 [00:24<00:41, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9371, LAS: 0.8851, UEM: 0.5599, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8156, partial_loss/deprel_loss: 0.7787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9709, loss: 0.8295, batch_reg_loss: 0.1848, reg_loss: 0.1846 ||: 41%|####1 | 39/95 [00:26<00:35, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9384, LAS: 0.8866, UEM: 0.5612, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4756, partial_loss/deprel_loss: 0.5991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7593, loss: 0.8215, batch_reg_loss: 0.1849, reg_loss: 0.1846 ||: 45%|####5 | 43/95 [00:29<00:33, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9381, LAS: 0.8864, UEM: 0.5519, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5294, partial_loss/deprel_loss: 0.6338, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7978, loss: 0.8225, batch_reg_loss: 0.1850, reg_loss: 0.1846 ||: 49%|####9 | 47/95 [00:31<00:31, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9369, LAS: 0.8851, UEM: 0.5357, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9746, partial_loss/deprel_loss: 0.9515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1411, loss: 0.8355, batch_reg_loss: 0.1850, reg_loss: 0.1847 ||: 54%|#####3 | 51/95 [00:34<00:28, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9376, LAS: 0.8861, UEM: 0.5443, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2375, partial_loss/deprel_loss: 0.3977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.8279, batch_reg_loss: 0.1851, reg_loss: 0.1847 ||: 58%|#####7 | 55/95 [00:37<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9386, LAS: 0.8872, UEM: 0.5507, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.4675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.8197, batch_reg_loss: 0.1851, reg_loss: 0.1847 ||: 61%|######1 | 58/95 [00:39<00:25, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9364, LAS: 0.8849, UEM: 0.5422, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8464, partial_loss/deprel_loss: 0.7982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9930, loss: 0.8352, batch_reg_loss: 0.1852, reg_loss: 0.1847 ||: 65%|######5 | 62/95 [00:42<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9139, UAS: 0.9373, LAS: 0.8858, UEM: 0.5426, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3489, partial_loss/deprel_loss: 0.5047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6588, loss: 0.8285, batch_reg_loss: 0.1852, reg_loss: 0.1848 ||: 69%|######9 | 66/95 [00:44<00:19, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9378, LAS: 0.8860, UEM: 0.5439, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2682, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.8271, batch_reg_loss: 0.1853, reg_loss: 0.1848 ||: 74%|#######3 | 70/95 [00:47<00:16, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9374, LAS: 0.8858, UEM: 0.5356, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6694, loss: 0.8292, batch_reg_loss: 0.1853, reg_loss: 0.1848 ||: 78%|#######7 | 74/95 [00:49<00:13, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9384, LAS: 0.8870, UEM: 0.5484, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6598, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8299, loss: 0.8207, batch_reg_loss: 0.1854, reg_loss: 0.1848 ||: 82%|########2 | 78/95 [00:51<00:10, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9392, LAS: 0.8877, UEM: 0.5513, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4937, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7449, loss: 0.8148, batch_reg_loss: 0.1854, reg_loss: 0.1849 ||: 86%|########6 | 82/95 [00:54<00:07, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9389, LAS: 0.8873, UEM: 0.5511, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7606, partial_loss/deprel_loss: 0.7955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9740, loss: 0.8184, batch_reg_loss: 0.1855, reg_loss: 0.1849 ||: 91%|######### | 86/95 [00:56<00:05, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9400, LAS: 0.8885, UEM: 0.5753, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6608, partial_loss/deprel_loss: 0.7416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9110, loss: 0.8076, batch_reg_loss: 0.1855, reg_loss: 0.1849 ||: 95%|#########4| 90/95 [00:59<00:03, 1.63it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9410, LAS: 0.8896, UEM: 0.5826, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4913, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7294, loss: 0.7992, batch_reg_loss: 0.1856, reg_loss: 0.1850 ||: 99%|#########8| 94/95 [01:01<00:00, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9410, LAS: 0.8896, UEM: 0.5808, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5826, partial_loss/deprel_loss: 0.6339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8092, loss: 0.7993, batch_reg_loss: 0.1856, reg_loss: 0.1850 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 
00:17:08,825 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:17:08,825 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - reg_loss | 0.185 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UEM | 0.581 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - LEM | 0.340 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EM | 0.885 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.583 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.634 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - loss | 0.799 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + 
"2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:17:08,827 - INFO - combo.training.trainer - Epoch duration: 0:01:02.242022\n", + "2023-04-07 00:17:08,828 - INFO - combo.training.trainer - Estimated training time remaining: 6:01:23\n", + "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - Epoch 78/399\n", + "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:17:08,835 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9408, LAS: 0.8896, UEM: 0.4489, LEM: 0.1972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3233, partial_loss/deprel_loss: 0.4872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6400, loss: 0.7744, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 4%|4 | 4/95 [00:02<00:50, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9516, LAS: 0.9008, UEM: 0.5703, LEM: 0.2929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4229, partial_loss/deprel_loss: 0.5818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.7034, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 9%|9 | 9/95 [00:04<00:44, 1.92it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9517, LAS: 0.9012, UEM: 0.5555, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4896, 
partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7013, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||: 15%|#4 | 14/95 [00:06<00:40, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9517, LAS: 0.9016, UEM: 0.5903, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9200, partial_loss/deprel_loss: 0.7536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9726, loss: 0.6973, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||: 18%|#7 | 17/95 [00:08<00:43, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8616, UAS: 0.9495, LAS: 0.8992, UEM: 0.5741, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0144, partial_loss/deprel_loss: 0.8644, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0801, loss: 0.7219, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||: 21%|##1 | 20/95 [00:10<00:45, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9484, LAS: 0.8985, UEM: 0.5931, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2113, partial_loss/deprel_loss: 0.8566, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1133, loss: 0.7258, batch_reg_loss: 0.1857, reg_loss: 0.1857 ||: 24%|##4 | 23/95 [00:12<00:45, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9433, LAS: 0.8927, UEM: 0.5676, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9793, partial_loss/deprel_loss: 0.8778, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.7736, batch_reg_loss: 0.1858, reg_loss: 0.1857 ||: 28%|##8 | 27/95 [00:15<00:43, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9438, LAS: 0.8934, UEM: 0.5776, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1801, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.7694, batch_reg_loss: 0.1858, reg_loss: 0.1857 ||: 32%|###1 | 30/95 [00:17<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9449, LAS: 0.8951, UEM: 0.5874, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1557, partial_loss/deprel_loss: 0.3232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4756, loss: 0.7584, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||: 36%|###5 | 34/95 [00:20<00:40, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9446, LAS: 0.8950, UEM: 0.5828, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0273, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0282, loss: 0.7593, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||: 39%|###8 | 37/95 [00:22<00:39, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9452, LAS: 0.8955, UEM: 0.5810, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6163, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8693, loss: 0.7570, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||: 42%|####2 | 40/95 [00:24<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9457, LAS: 0.8963, UEM: 0.6039, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1135, partial_loss/deprel_loss: 0.2364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3978, loss: 0.7489, batch_reg_loss: 0.1860, reg_loss: 0.1857 ||: 45%|####5 | 43/95 [00:27<00:38, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9445, LAS: 0.8949, UEM: 0.6038, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5934, loss: 0.7595, batch_reg_loss: 0.1860, reg_loss: 0.1858 ||: 49%|####9 | 47/95 [00:30<00:34, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9448, LAS: 0.8950, UEM: 0.6067, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8152, loss: 0.7586, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||: 53%|#####2 | 50/95 [00:32<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9457, LAS: 0.8961, UEM: 0.6171, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4020, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.7499, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||: 56%|#####5 | 53/95 [00:34<00:31, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9461, LAS: 0.8965, UEM: 0.6158, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3005, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.7458, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||: 59%|#####8 | 56/95 [00:37<00:30, 1.30it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9464, LAS: 0.8966, UEM: 0.6168, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7613, partial_loss/deprel_loss: 0.6916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8917, loss: 0.7440, batch_reg_loss: 0.1862, reg_loss: 0.1858 ||: 62%|######2 | 59/95 [00:39<00:29, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9471, LAS: 0.8972, UEM: 0.6218, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6331, loss: 0.7379, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||: 65%|######5 | 62/95 [00:42<00:26, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9469, LAS: 0.8969, UEM: 0.6130, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6629, partial_loss/deprel_loss: 0.6976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8769, loss: 0.7409, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||: 68%|######8 | 65/95 [00:44<00:22, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9460, LAS: 0.8959, UEM: 0.6022, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4262, partial_loss/deprel_loss: 0.5080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.7506, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||: 73%|#######2 | 69/95 [00:46<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9448, LAS: 0.8947, UEM: 0.5979, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.0539, partial_loss/deprel_loss: 0.8267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0584, loss: 0.7597, batch_reg_loss: 0.1863, reg_loss: 0.1859 ||: 77%|#######6 | 73/95 [00:49<00:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9446, LAS: 0.8948, UEM: 0.6111, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2930, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1742, loss: 0.7602, batch_reg_loss: 0.1863, reg_loss: 0.1859 ||: 80%|######## | 76/95 [00:51<00:13, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9432, LAS: 0.8931, UEM: 0.6007, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6972, partial_loss/deprel_loss: 0.7468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9233, loss: 0.7716, batch_reg_loss: 0.1864, reg_loss: 0.1859 ||: 84%|########4 | 80/95 [00:53<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9420, LAS: 0.8918, UEM: 0.5955, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 0.7820, batch_reg_loss: 0.1864, reg_loss: 0.1860 ||: 88%|########8 | 84/95 [00:56<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9415, LAS: 0.8910, UEM: 0.5861, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5924, partial_loss/deprel_loss: 0.6303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8092, loss: 0.7896, batch_reg_loss: 0.1865, reg_loss: 0.1860 ||: 93%|#########2| 88/95 [00:59<00:04, 
1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9401, LAS: 0.8894, UEM: 0.5803, LEM: 0.3445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5862, loss: 0.7997, batch_reg_loss: 0.1866, reg_loss: 0.1860 ||: 97%|#########6| 92/95 [01:01<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9401, LAS: 0.8894, UEM: 0.5777, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8968, partial_loss/deprel_loss: 0.7831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9924, loss: 0.8005, batch_reg_loss: 0.1866, reg_loss: 0.1860 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - reg_loss | 0.186 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - UEM | 0.578 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - LEM | 0.340 | N/A\n", + "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EM | 0.866 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.897 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + 
"2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.783 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - loss | 0.800 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - LAS | 0.889 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:12,490 - INFO - combo.training.trainer - Epoch duration: 0:01:03.662416\n", + "2023-04-07 00:18:12,490 - INFO - combo.training.trainer - Estimated training time remaining: 6:00:01\n", + "2023-04-07 00:18:12,490 - INFO - allennlp.training.trainer - Epoch 79/399\n", + "2023-04-07 00:18:12,490 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:18:12,491 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:18:12,498 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9283, LAS: 0.8772, 
UEM: 0.4899, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2977, partial_loss/deprel_loss: 0.4617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6156, loss: 0.8829, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||: 3%|3 | 3/95 [00:02<01:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9239, LAS: 0.8754, UEM: 0.5283, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3208, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.8969, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||: 6%|6 | 6/95 [00:04<01:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9365, LAS: 0.8881, UEM: 0.5864, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4957, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8162, loss: 0.8139, batch_reg_loss: 0.1868, reg_loss: 0.1867 ||: 9%|9 | 9/95 [00:06<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9396, LAS: 0.8913, UEM: 0.6205, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4121, partial_loss/deprel_loss: 0.5223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.7861, batch_reg_loss: 0.1868, reg_loss: 0.1867 ||: 13%|#2 | 12/95 [00:08<01:01, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9441, LAS: 0.8958, UEM: 0.6585, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2032, partial_loss/deprel_loss: 0.3666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5207, loss: 0.7440, batch_reg_loss: 0.1869, reg_loss: 0.1868 
||: 16%|#5 | 15/95 [00:11<01:00, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9459, LAS: 0.8981, UEM: 0.6616, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.4213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.7234, batch_reg_loss: 0.1869, reg_loss: 0.1868 ||: 19%|#8 | 18/95 [00:13<00:59, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9478, LAS: 0.9004, UEM: 0.6716, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6162, partial_loss/deprel_loss: 0.6331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8167, loss: 0.7079, batch_reg_loss: 0.1869, reg_loss: 0.1868 ||: 22%|##2 | 21/95 [00:15<00:55, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9474, LAS: 0.9000, UEM: 0.6755, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0440, partial_loss/deprel_loss: 0.8140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0470, loss: 0.7136, batch_reg_loss: 0.1870, reg_loss: 0.1868 ||: 25%|##5 | 24/95 [00:18<00:55, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9417, LAS: 0.8937, UEM: 0.6401, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.8241, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0568, loss: 0.7640, batch_reg_loss: 0.1870, reg_loss: 0.1868 ||: 29%|##9 | 28/95 [00:20<00:49, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9379, LAS: 0.8896, UEM: 0.6116, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3279, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1551, loss: 0.7982, batch_reg_loss: 0.1870, reg_loss: 0.1869 ||: 34%|###3 | 32/95 [00:23<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9366, LAS: 0.8882, UEM: 0.5996, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3334, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.8117, batch_reg_loss: 0.1871, reg_loss: 0.1869 ||: 38%|###7 | 36/95 [00:25<00:37, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8622, UAS: 0.9358, LAS: 0.8873, UEM: 0.5815, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8832, partial_loss/deprel_loss: 0.7934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9985, loss: 0.8199, batch_reg_loss: 0.1872, reg_loss: 0.1869 ||: 43%|####3 | 41/95 [00:27<00:32, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9343, LAS: 0.8852, UEM: 0.5650, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0274, partial_loss/deprel_loss: 0.8131, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0432, loss: 0.8361, batch_reg_loss: 0.1873, reg_loss: 0.1870 ||: 48%|####8 | 46/95 [00:29<00:27, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9351, LAS: 0.8856, UEM: 0.5620, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7816, loss: 0.8314, batch_reg_loss: 0.1873, reg_loss: 0.1870 ||: 53%|#####2 | 50/95 [00:31<00:24, 
1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9369, LAS: 0.8876, UEM: 0.5930, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5163, partial_loss/deprel_loss: 0.5533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.8152, batch_reg_loss: 0.1874, reg_loss: 0.1870 ||: 57%|#####6 | 54/95 [00:35<00:25, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8488, UAS: 0.9359, LAS: 0.8866, UEM: 0.5788, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1207, partial_loss/deprel_loss: 0.8376, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0817, loss: 0.8220, batch_reg_loss: 0.1875, reg_loss: 0.1870 ||: 61%|######1 | 58/95 [00:37<00:23, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9366, LAS: 0.8873, UEM: 0.5778, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 0.5361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.8168, batch_reg_loss: 0.1875, reg_loss: 0.1871 ||: 65%|######5 | 62/95 [00:40<00:21, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9374, LAS: 0.8880, UEM: 0.5757, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8132, batch_reg_loss: 0.1876, reg_loss: 0.1871 ||: 69%|######9 | 66/95 [00:43<00:18, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9378, LAS: 0.8881, UEM: 0.5715, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8813, loss: 0.8116, batch_reg_loss: 0.1876, reg_loss: 0.1871 ||: 74%|#######3 | 70/95 [00:45<00:16, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9375, LAS: 0.8878, UEM: 0.5671, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.3709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5340, loss: 0.8145, batch_reg_loss: 0.1877, reg_loss: 0.1872 ||: 78%|#######7 | 74/95 [00:48<00:13, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9382, LAS: 0.8884, UEM: 0.5671, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4622, partial_loss/deprel_loss: 0.5921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8099, batch_reg_loss: 0.1877, reg_loss: 0.1872 ||: 82%|########2 | 78/95 [00:50<00:10, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9385, LAS: 0.8885, UEM: 0.5614, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6567, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8476, loss: 0.8097, batch_reg_loss: 0.1878, reg_loss: 0.1872 ||: 86%|########6 | 82/95 [00:53<00:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9396, LAS: 0.8897, UEM: 0.5765, LEM: 0.3417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4273, partial_loss/deprel_loss: 0.5450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 0.8001, 
batch_reg_loss: 0.1878, reg_loss: 0.1872 ||: 91%|######### | 86/95 [00:55<00:05, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9400, LAS: 0.8899, UEM: 0.5763, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3665, partial_loss/deprel_loss: 0.5096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6688, loss: 0.7984, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||: 95%|#########4| 90/95 [00:58<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9405, LAS: 0.8904, UEM: 0.5754, LEM: 0.3353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3016, partial_loss/deprel_loss: 0.5141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6595, loss: 0.7965, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||: 99%|#########8| 94/95 [01:01<00:00, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9408, LAS: 0.8907, UEM: 0.5806, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2214, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5335, loss: 0.7937, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||: 100%|##########| 95/95 [01:01<00:00, 1.53it/s]\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - reg_loss | 0.187 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UEM | 
0.581 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - LEM | 0.340 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EM | 0.920 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.221 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.377 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - loss | 0.794 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - LAS | 0.891 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:19:14,424 - INFO - combo.training.trainer - Epoch duration: 0:01:01.933450\n", + "2023-04-07 00:19:14,424 - INFO - combo.training.trainer - Estimated training time remaining: 5:58:32\n", + "2023-04-07 00:19:14,424 - INFO - 
allennlp.training.trainer - Epoch 80/399\n", + "2023-04-07 00:19:14,424 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:19:14,424 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:19:14,431 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9596, LAS: 0.9109, UEM: 0.6800, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1690, partial_loss/deprel_loss: 0.3843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5292, loss: 0.6419, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 4%|4 | 4/95 [00:02<01:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9480, LAS: 0.8989, UEM: 0.6161, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5638, loss: 0.7364, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 7%|7 | 7/95 [00:05<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9512, LAS: 0.9017, UEM: 0.6269, LEM: 0.3572, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.7124, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 12%|#1 | 11/95 [00:07<01:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9506, LAS: 0.9014, UEM: 0.6104, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6724, loss: 
0.7203, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||: 15%|#4 | 14/95 [00:10<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9499, LAS: 0.9004, UEM: 0.5876, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2876, partial_loss/deprel_loss: 0.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7232, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||: 19%|#8 | 18/95 [00:12<00:52, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9505, LAS: 0.9008, UEM: 0.5854, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5094, partial_loss/deprel_loss: 0.5760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7508, loss: 0.7181, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||: 22%|##2 | 21/95 [00:14<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9527, LAS: 0.9041, UEM: 0.6489, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3647, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.6928, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||: 25%|##5 | 24/95 [00:17<00:53, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9512, LAS: 0.9019, UEM: 0.6426, LEM: 0.3904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5918, partial_loss/deprel_loss: 0.6836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8535, loss: 0.7120, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||: 29%|##9 | 28/95 [00:19<00:48, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9469, LAS: 0.8971, UEM: 0.6465, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1478, partial_loss/deprel_loss: 0.3533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.7485, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||: 33%|###2 | 31/95 [00:22<00:48, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9449, LAS: 0.8948, UEM: 0.6225, LEM: 0.3811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7762, loss: 0.7667, batch_reg_loss: 0.1883, reg_loss: 0.1881 ||: 37%|###6 | 35/95 [00:25<00:44, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9454, LAS: 0.8954, UEM: 0.6357, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6944, partial_loss/deprel_loss: 0.7790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9504, loss: 0.7592, batch_reg_loss: 0.1883, reg_loss: 0.1881 ||: 40%|#### | 38/95 [00:27<00:42, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9443, LAS: 0.8940, UEM: 0.6177, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6552, loss: 0.7663, batch_reg_loss: 0.1884, reg_loss: 0.1881 ||: 44%|####4 | 42/95 [00:30<00:38, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9422, LAS: 0.8914, UEM: 0.5969, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8455, partial_loss/deprel_loss: 0.6861, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.9064, loss: 0.7889, batch_reg_loss: 0.1884, reg_loss: 0.1882 ||: 48%|####8 | 46/95 [00:32<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9425, LAS: 0.8919, UEM: 0.5920, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5160, partial_loss/deprel_loss: 0.7093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8591, loss: 0.7868, batch_reg_loss: 0.1885, reg_loss: 0.1882 ||: 52%|#####1 | 49/95 [00:34<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8074, UAS: 0.9416, LAS: 0.8908, UEM: 0.5890, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6451, partial_loss/deprel_loss: 1.1061, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4024, loss: 0.7942, batch_reg_loss: 0.1885, reg_loss: 0.1882 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9404, LAS: 0.8894, UEM: 0.5855, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.4170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.8047, batch_reg_loss: 0.1886, reg_loss: 0.1882 ||: 58%|#####7 | 55/95 [00:39<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9407, LAS: 0.8896, UEM: 0.5849, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.4808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6261, loss: 0.8032, batch_reg_loss: 0.1886, reg_loss: 0.1882 ||: 61%|######1 | 58/95 [00:41<00:28, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9091, UAS: 0.9413, LAS: 0.8899, UEM: 0.5889, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2398, partial_loss/deprel_loss: 0.4865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7995, batch_reg_loss: 0.1887, reg_loss: 0.1883 ||: 64%|######4 | 61/95 [00:43<00:25, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9420, LAS: 0.8905, UEM: 0.5975, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4616, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7639, loss: 0.7946, batch_reg_loss: 0.1887, reg_loss: 0.1883 ||: 68%|######8 | 65/95 [00:46<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9431, LAS: 0.8917, UEM: 0.6147, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5303, partial_loss/deprel_loss: 0.6276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7969, loss: 0.7829, batch_reg_loss: 0.1888, reg_loss: 0.1883 ||: 73%|#######2 | 69/95 [00:48<00:16, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9418, LAS: 0.8903, UEM: 0.6083, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9466, partial_loss/deprel_loss: 0.7993, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0175, loss: 0.7934, batch_reg_loss: 0.1888, reg_loss: 0.1883 ||: 78%|#######7 | 74/95 [00:50<00:12, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9411, LAS: 0.8898, UEM: 0.5973, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0785, partial_loss/deprel_loss: 0.8666, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.0979, loss: 0.7982, batch_reg_loss: 0.1889, reg_loss: 0.1884 ||: 83%|########3 | 79/95 [00:52<00:08, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9412, LAS: 0.8899, UEM: 0.5901, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.7978, batch_reg_loss: 0.1889, reg_loss: 0.1884 ||: 87%|########7 | 83/95 [00:57<00:08, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8699, UAS: 0.9408, LAS: 0.8894, UEM: 0.5842, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7730, partial_loss/deprel_loss: 0.7625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9536, loss: 0.8019, batch_reg_loss: 0.1890, reg_loss: 0.1884 ||: 92%|#########1| 87/95 [01:00<00:05, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9403, LAS: 0.8888, UEM: 0.5809, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3301, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1725, loss: 0.8064, batch_reg_loss: 0.1890, reg_loss: 0.1884 ||: 96%|#########5| 91/95 [01:02<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9402, LAS: 0.8888, UEM: 0.5777, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 0.8068, batch_reg_loss: 0.1891, reg_loss: 0.1885 ||: 100%|##########| 95/95 [01:05<00:00, 1.48it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9402, LAS: 0.8888, UEM: 0.5777, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 0.8068, batch_reg_loss: 0.1891, reg_loss: 0.1885 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-07 00:20:19,918 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9691, LAS: 0.9273, UEM: 0.8205, LEM: 0.5921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 17.6571, partial_loss/cycle_loss: 0.0000, batch_loss: 14.1622, loss: 18.2288, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:06, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9466, LAS: 0.8977, UEM: 0.7012, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5806, partial_loss/deprel_loss: 53.6078, partial_loss/cycle_loss: 0.0000, batch_loss: 43.2024, loss: 23.0699, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9507, LAS: 0.9004, UEM: 0.7089, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8707, partial_loss/deprel_loss: 32.8457, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4507, loss: 22.7814, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 
0.9472, LAS: 0.8956, UEM: 0.6708, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0470, partial_loss/deprel_loss: 41.2218, partial_loss/cycle_loss: 0.0000, batch_loss: 33.1868, loss: 25.0364, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.06it/s]\n", + "2023-04-07 00:20:30,262 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - reg_loss | 0.188 | 0.000\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UEM | 0.578 | 0.671\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - LEM | 0.337 | 0.403\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EM | 0.863 | 0.871\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.851 | 1.047\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | 0.947\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.810 | 41.222\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - loss | 0.807 | 25.036\n", + "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:20:30,264 
- INFO - combo.training.tensorboard_writer - LAS | 0.889 | 0.896\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:20:30,265 - INFO - combo.training.trainer - Epoch duration: 0:01:15.840607\n", + "2023-04-07 00:20:30,265 - INFO - combo.training.trainer - Estimated training time remaining: 5:57:59\n", + "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - Epoch 81/399\n", + "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:20:30,272 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9532, LAS: 0.9055, UEM: 0.5120, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4113, partial_loss/deprel_loss: 0.5896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7431, loss: 0.6814, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9465, LAS: 0.8960, UEM: 0.4424, LEM: 0.1781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.6396, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8196, loss: 0.7523, batch_reg_loss: 0.1892, reg_loss: 0.1891 ||: 8%|8 | 8/95 [00:05<00:55, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9517, LAS: 0.9022, UEM: 0.5925, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.7044, batch_reg_loss: 0.1892, reg_loss: 0.1892 ||: 12%|#1 | 11/95 [00:07<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9473, LAS: 0.8976, UEM: 0.5870, LEM: 0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.4169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5857, loss: 0.7374, batch_reg_loss: 0.1893, reg_loss: 0.1892 ||: 15%|#4 | 14/95 [00:09<00:57, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9491, LAS: 0.8992, UEM: 0.5768, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3695, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6929, loss: 0.7260, batch_reg_loss: 0.1893, reg_loss: 0.1892 ||: 19%|#8 | 18/95 [00:12<00:52, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9461, LAS: 0.8960, UEM: 0.5606, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3091, partial_loss/deprel_loss: 0.4978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.7472, batch_reg_loss: 0.1894, reg_loss: 0.1892 ||: 23%|##3 | 22/95 [00:14<00:48, 1.50it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9437, LAS: 0.8932, UEM: 0.5314, LEM: 0.2714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9095, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1428, loss: 0.7699, batch_reg_loss: 0.1894, reg_loss: 0.1893 ||: 27%|##7 | 26/95 [00:17<00:46, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9407, LAS: 0.8901, UEM: 0.5317, LEM: 0.2779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6746, partial_loss/deprel_loss: 1.0439, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3595, loss: 0.7930, batch_reg_loss: 0.1894, reg_loss: 0.1893 ||: 31%|### | 29/95 [00:19<00:46, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9421, LAS: 0.8916, UEM: 0.5485, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.7818, batch_reg_loss: 0.1895, reg_loss: 0.1893 ||: 34%|###3 | 32/95 [00:22<00:45, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9428, LAS: 0.8925, UEM: 0.5586, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5909, loss: 0.7759, batch_reg_loss: 0.1895, reg_loss: 0.1893 ||: 37%|###6 | 35/95 [00:24<00:44, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9435, LAS: 0.8932, UEM: 0.5609, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, 
partial_loss/deprel_loss: 0.4473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5903, loss: 0.7733, batch_reg_loss: 0.1896, reg_loss: 0.1893 ||: 41%|####1 | 39/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9444, LAS: 0.8943, UEM: 0.5979, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2540, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.7647, batch_reg_loss: 0.1896, reg_loss: 0.1894 ||: 44%|####4 | 42/95 [00:29<00:40, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9431, LAS: 0.8931, UEM: 0.6082, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4032, partial_loss/deprel_loss: 0.9042, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1936, loss: 0.7752, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||: 47%|####7 | 45/95 [00:31<00:37, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9439, LAS: 0.8941, UEM: 0.6117, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4422, partial_loss/deprel_loss: 0.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7067, loss: 0.7698, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||: 51%|##### | 48/95 [00:34<00:36, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9430, LAS: 0.8932, UEM: 0.6004, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6614, partial_loss/deprel_loss: 0.6990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8812, loss: 0.7761, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||: 54%|#####3 | 51/95 [00:36<00:33, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9410, LAS: 0.8910, UEM: 0.5863, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6204, partial_loss/deprel_loss: 0.6619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.7930, batch_reg_loss: 0.1898, reg_loss: 0.1894 ||: 58%|#####7 | 55/95 [00:39<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9415, LAS: 0.8917, UEM: 0.5858, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5730, loss: 0.7890, batch_reg_loss: 0.1898, reg_loss: 0.1895 ||: 62%|######2 | 59/95 [00:41<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9417, LAS: 0.8917, UEM: 0.5870, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2479, partial_loss/deprel_loss: 0.3969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.7890, batch_reg_loss: 0.1899, reg_loss: 0.1895 ||: 65%|######5 | 62/95 [00:44<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9418, LAS: 0.8917, UEM: 0.5857, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7133, partial_loss/deprel_loss: 0.6690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8678, loss: 0.7870, batch_reg_loss: 0.1899, reg_loss: 0.1895 ||: 68%|######8 | 65/95 [00:46<00:21, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8292, UAS: 0.9408, LAS: 0.8906, UEM: 0.5769, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4467, 
partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3266, loss: 0.7982, batch_reg_loss: 0.1900, reg_loss: 0.1895 ||: 72%|#######1 | 68/95 [00:48<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9413, LAS: 0.8911, UEM: 0.5811, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1525, partial_loss/deprel_loss: 0.3706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5170, loss: 0.7954, batch_reg_loss: 0.1900, reg_loss: 0.1896 ||: 76%|#######5 | 72/95 [00:50<00:15, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9413, LAS: 0.8908, UEM: 0.5743, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4549, partial_loss/deprel_loss: 0.5787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.7975, batch_reg_loss: 0.1901, reg_loss: 0.1896 ||: 80%|######## | 76/95 [00:53<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9407, LAS: 0.8899, UEM: 0.5642, LEM: 0.3228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0134, partial_loss/deprel_loss: 0.7880, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0232, loss: 0.8038, batch_reg_loss: 0.1901, reg_loss: 0.1896 ||: 84%|########4 | 80/95 [00:55<00:09, 1.61it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9418, LAS: 0.8909, UEM: 0.5782, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5291, partial_loss/deprel_loss: 0.6351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8040, loss: 0.7943, batch_reg_loss: 0.1902, reg_loss: 0.1896 ||: 
89%|########9 | 85/95 [00:57<00:05, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9418, LAS: 0.8910, UEM: 0.5920, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.7921, batch_reg_loss: 0.1902, reg_loss: 0.1897 ||: 95%|#########4| 90/95 [01:00<00:02, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9413, LAS: 0.8902, UEM: 0.5830, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7992, batch_reg_loss: 0.1903, reg_loss: 0.1897 ||: 100%|##########| 95/95 [01:02<00:00, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9413, LAS: 0.8902, UEM: 0.5830, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7992, batch_reg_loss: 0.1903, reg_loss: 0.1897 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:21:33,036 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - reg_loss | 0.190 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:21:33,037 - 
INFO - combo.training.tensorboard_writer - LEM | 0.335 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EM | 0.897 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.430 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.612 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - loss | 0.799 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:33,038 - INFO - combo.training.trainer - Epoch duration: 0:01:02.773691\n", + "2023-04-07 00:21:33,039 - INFO - combo.training.trainer - Estimated training time remaining: 5:56:34\n", + "2023-04-07 00:21:33,039 - INFO - allennlp.training.trainer - Epoch 82/399\n", + "2023-04-07 
00:21:33,039 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:21:33,039 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:21:33,046 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9454, LAS: 0.8927, UEM: 0.4833, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4030, partial_loss/deprel_loss: 0.5688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7260, loss: 0.7748, batch_reg_loss: 0.1903, reg_loss: 0.1903 ||: 4%|4 | 4/95 [00:02<00:58, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9485, LAS: 0.8984, UEM: 0.5650, LEM: 0.3109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5287, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7443, loss: 0.7361, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 8%|8 | 8/95 [00:05<00:55, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9496, LAS: 0.8982, UEM: 0.5911, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.7561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9382, loss: 0.7368, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 12%|#1 | 11/95 [00:07<00:54, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9496, LAS: 0.8991, UEM: 0.5772, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3317, partial_loss/deprel_loss: 0.5018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.7337, batch_reg_loss: 0.1905, reg_loss: 0.1904 ||: 16%|#5 | 
15/95 [00:09<00:51, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9427, LAS: 0.8916, UEM: 0.5607, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9665, partial_loss/deprel_loss: 1.0984, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4625, loss: 0.7855, batch_reg_loss: 0.1905, reg_loss: 0.1904 ||: 19%|#8 | 18/95 [00:12<00:53, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9454, LAS: 0.8947, UEM: 0.5856, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2318, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.7637, batch_reg_loss: 0.1906, reg_loss: 0.1904 ||: 22%|##2 | 21/95 [00:14<00:53, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9450, LAS: 0.8941, UEM: 0.5764, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6122, loss: 0.7734, batch_reg_loss: 0.1906, reg_loss: 0.1905 ||: 26%|##6 | 25/95 [00:16<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9443, LAS: 0.8936, UEM: 0.5872, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5380, loss: 0.7777, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||: 29%|##9 | 28/95 [00:19<00:48, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9446, LAS: 0.8944, UEM: 
0.6237, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.2652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4289, loss: 0.7715, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||: 33%|###2 | 31/95 [00:21<00:47, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9454, LAS: 0.8951, UEM: 0.6163, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6524, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8422, loss: 0.7654, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||: 37%|###6 | 35/95 [00:24<00:42, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9465, LAS: 0.8960, UEM: 0.6211, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6097, loss: 0.7576, batch_reg_loss: 0.1908, reg_loss: 0.1905 ||: 40%|#### | 38/95 [00:26<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9463, LAS: 0.8960, UEM: 0.6213, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1968, partial_loss/deprel_loss: 0.8406, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1027, loss: 0.7585, batch_reg_loss: 0.1908, reg_loss: 0.1906 ||: 43%|####3 | 41/95 [00:28<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9473, LAS: 0.8972, UEM: 0.6317, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2926, partial_loss/deprel_loss: 0.4871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6391, loss: 0.7465, batch_reg_loss: 0.1908, 
reg_loss: 0.1906 ||: 46%|####6 | 44/95 [00:31<00:39, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9456, LAS: 0.8952, UEM: 0.6137, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5593, partial_loss/deprel_loss: 0.5878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7730, loss: 0.7609, batch_reg_loss: 0.1909, reg_loss: 0.1906 ||: 51%|##### | 48/95 [00:33<00:34, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9454, LAS: 0.8951, UEM: 0.6163, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2513, partial_loss/deprel_loss: 0.9229, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1795, loss: 0.7621, batch_reg_loss: 0.1909, reg_loss: 0.1906 ||: 55%|#####4 | 52/95 [00:36<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9464, LAS: 0.8965, UEM: 0.6368, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4366, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.7526, batch_reg_loss: 0.1910, reg_loss: 0.1906 ||: 58%|#####7 | 55/95 [00:38<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9463, LAS: 0.8961, UEM: 0.6380, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7707, partial_loss/deprel_loss: 0.7863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.7552, batch_reg_loss: 0.1910, reg_loss: 0.1907 ||: 61%|######1 | 58/95 [00:40<00:26, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9463, LAS: 0.8962, UEM: 0.6314, LEM: 0.3879, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8695, partial_loss/deprel_loss: 0.7489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9641, loss: 0.7544, batch_reg_loss: 0.1910, reg_loss: 0.1907 ||: 65%|######5 | 62/95 [00:42<00:22, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9459, LAS: 0.8956, UEM: 0.6232, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4445, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.7598, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||: 68%|######8 | 65/95 [00:45<00:21, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9439, LAS: 0.8935, UEM: 0.6157, LEM: 0.3744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4739, partial_loss/deprel_loss: 0.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7400, loss: 0.7744, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9430, LAS: 0.8924, UEM: 0.6092, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3128, partial_loss/deprel_loss: 0.9474, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2116, loss: 0.7842, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||: 75%|#######4 | 71/95 [00:49<00:17, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9436, LAS: 0.8929, UEM: 0.6133, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4393, partial_loss/deprel_loss: 0.5510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7199, loss: 0.7798, batch_reg_loss: 0.1912, reg_loss: 
0.1908 ||: 78%|#######7 | 74/95 [00:52<00:15, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9429, LAS: 0.8922, UEM: 0.6096, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.3906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.7844, batch_reg_loss: 0.1913, reg_loss: 0.1908 ||: 82%|########2 | 78/95 [00:54<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9426, LAS: 0.8916, UEM: 0.6021, LEM: 0.3612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3763, partial_loss/deprel_loss: 0.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6555, loss: 0.7880, batch_reg_loss: 0.1913, reg_loss: 0.1908 ||: 86%|########6 | 82/95 [00:57<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9417, LAS: 0.8905, UEM: 0.5911, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8662, partial_loss/deprel_loss: 0.7807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9892, loss: 0.7954, batch_reg_loss: 0.1914, reg_loss: 0.1908 ||: 91%|######### | 86/95 [00:59<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9417, LAS: 0.8904, UEM: 0.5910, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2937, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6542, loss: 0.7962, batch_reg_loss: 0.1914, reg_loss: 0.1909 ||: 94%|#########3| 89/95 [01:02<00:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9420, LAS: 0.8908, UEM: 0.5895, LEM: 
0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4636, partial_loss/deprel_loss: 0.5941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7595, loss: 0.7946, batch_reg_loss: 0.1915, reg_loss: 0.1909 ||: 98%|#########7| 93/95 [01:05<00:01, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9412, LAS: 0.8899, UEM: 0.5850, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3715, partial_loss/deprel_loss: 1.0574, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3117, loss: 0.8027, batch_reg_loss: 0.1915, reg_loss: 0.1909 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - reg_loss | 0.191 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UEM | 0.585 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - LEM | 0.347 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EM | 0.833 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.372 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + 
"2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.057 | N/A\n", + "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - loss | 0.803 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:39,477 - INFO - combo.training.trainer - Epoch duration: 0:01:06.437919\n", + "2023-04-07 00:22:39,477 - INFO - combo.training.trainer - Estimated training time remaining: 5:55:24\n", + "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - Epoch 83/399\n", + "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:22:39,484 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9375, LAS: 0.8905, UEM: 0.5267, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2462, partial_loss/deprel_loss: 0.3812, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.7993, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 3%|3 | 3/95 [00:02<01:11, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.9347, LAS: 0.8856, UEM: 0.5202, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6103, partial_loss/deprel_loss: 0.9962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3106, loss: 0.8429, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 6%|6 | 6/95 [00:04<01:06, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8114, UAS: 0.9304, LAS: 0.8810, UEM: 0.5515, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6095, partial_loss/deprel_loss: 1.1064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3986, loss: 0.8810, batch_reg_loss: 0.1917, reg_loss: 0.1916 ||: 9%|9 | 9/95 [00:06<01:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9339, LAS: 0.8839, UEM: 0.5453, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9913, partial_loss/deprel_loss: 0.7666, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0033, loss: 0.8616, batch_reg_loss: 0.1917, reg_loss: 0.1916 ||: 13%|#2 | 12/95 [00:08<01:01, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.9338, LAS: 0.8836, UEM: 0.5344, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3335, partial_loss/deprel_loss: 0.9585, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2253, loss: 0.8581, batch_reg_loss: 0.1918, reg_loss: 0.1917 ||: 18%|#7 | 17/95 [00:11<00:51, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9195, UAS: 0.9382, LAS: 0.8884, UEM: 0.5477, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.4284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.8215, batch_reg_loss: 0.1919, reg_loss: 0.1917 ||: 23%|##3 | 22/95 [00:13<00:43, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8598, UAS: 0.9377, LAS: 0.8880, UEM: 0.5889, LEM: 0.3612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9696, partial_loss/deprel_loss: 0.8608, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0744, loss: 0.8261, batch_reg_loss: 0.1919, reg_loss: 0.1917 ||: 27%|##7 | 26/95 [00:15<00:39, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9411, LAS: 0.8912, UEM: 0.6167, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2082, partial_loss/deprel_loss: 0.4205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5700, loss: 0.7990, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||: 32%|###1 | 30/95 [00:17<00:37, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9389, LAS: 0.8886, UEM: 0.5864, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8068, partial_loss/deprel_loss: 0.6758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8940, loss: 0.8122, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||: 36%|###5 | 34/95 [00:20<00:36, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9380, LAS: 0.8880, UEM: 0.5727, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9398, partial_loss/deprel_loss: 0.7578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9862, loss: 
0.8187, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||: 40%|#### | 38/95 [00:22<00:34, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9399, LAS: 0.8897, UEM: 0.5863, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3260, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.8047, batch_reg_loss: 0.1921, reg_loss: 0.1918 ||: 44%|####4 | 42/95 [00:25<00:34, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9413, LAS: 0.8914, UEM: 0.5879, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6506, partial_loss/deprel_loss: 0.6128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8125, loss: 0.7936, batch_reg_loss: 0.1921, reg_loss: 0.1919 ||: 48%|####8 | 46/95 [00:28<00:31, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9409, LAS: 0.8906, UEM: 0.5728, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8299, partial_loss/deprel_loss: 0.7765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9793, loss: 0.7979, batch_reg_loss: 0.1922, reg_loss: 0.1919 ||: 53%|#####2 | 50/95 [00:30<00:27, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9421, LAS: 0.8921, UEM: 0.5738, LEM: 0.3254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3728, partial_loss/deprel_loss: 0.5539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7100, loss: 0.7881, batch_reg_loss: 0.1922, reg_loss: 0.1919 ||: 57%|#####6 | 54/95 [00:32<00:24, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9421, LAS: 0.8923, UEM: 0.5675, LEM: 0.3222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3272, partial_loss/deprel_loss: 0.3356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5262, loss: 0.7879, batch_reg_loss: 0.1923, reg_loss: 0.1919 ||: 61%|######1 | 58/95 [00:35<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9409, LAS: 0.8907, UEM: 0.5630, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3436, partial_loss/deprel_loss: 0.9344, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2085, loss: 0.7989, batch_reg_loss: 0.1923, reg_loss: 0.1920 ||: 65%|######5 | 62/95 [00:38<00:21, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9404, LAS: 0.8903, UEM: 0.5566, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4736, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8042, batch_reg_loss: 0.1924, reg_loss: 0.1920 ||: 69%|######9 | 66/95 [00:41<00:19, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9413, LAS: 0.8911, UEM: 0.5739, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4320, partial_loss/deprel_loss: 0.6516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.7970, batch_reg_loss: 0.1924, reg_loss: 0.1920 ||: 74%|#######3 | 70/95 [00:44<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9412, LAS: 0.8909, UEM: 0.5722, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7803, partial_loss/deprel_loss: 0.8010, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.9893, loss: 0.7986, batch_reg_loss: 0.1925, reg_loss: 0.1920 ||: 77%|#######6 | 73/95 [00:46<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9411, LAS: 0.8906, UEM: 0.5774, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.8013, batch_reg_loss: 0.1925, reg_loss: 0.1920 ||: 80%|######## | 76/95 [00:48<00:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9402, LAS: 0.8895, UEM: 0.5729, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5167, partial_loss/deprel_loss: 0.5689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7510, loss: 0.8102, batch_reg_loss: 0.1926, reg_loss: 0.1921 ||: 84%|########4 | 80/95 [00:50<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9414, LAS: 0.8909, UEM: 0.5957, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.7994, batch_reg_loss: 0.1926, reg_loss: 0.1921 ||: 87%|########7 | 83/95 [00:53<00:08, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9407, LAS: 0.8902, UEM: 0.5896, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2760, partial_loss/deprel_loss: 0.9142, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1792, loss: 0.8046, batch_reg_loss: 0.1927, reg_loss: 0.1921 ||: 92%|#########1| 87/95 [00:55<00:05, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9407, LAS: 0.8903, UEM: 0.5877, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2826, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.8036, batch_reg_loss: 0.1927, reg_loss: 0.1921 ||: 95%|#########4| 90/95 [00:58<00:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9409, LAS: 0.8905, UEM: 0.5866, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6252, loss: 0.8015, batch_reg_loss: 0.1928, reg_loss: 0.1922 ||: 98%|#########7| 93/95 [01:00<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9408, LAS: 0.8904, UEM: 0.5829, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5981, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8536, loss: 0.8021, batch_reg_loss: 0.1928, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 00:23:40,869 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - reg_loss | 0.192 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - LEM | 0.342 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - 
combo.training.tensorboard_writer - EM | 0.884 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.598 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.676 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - LAS | 0.890 | N/A\n", + "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:23:40,871 - INFO - combo.training.trainer - Epoch duration: 0:01:01.394685\n", + "2023-04-07 00:23:40,872 - INFO - combo.training.trainer - Estimated training time remaining: 5:53:54\n", + "2023-04-07 00:23:40,872 - INFO - allennlp.training.trainer - Epoch 84/399\n", + "2023-04-07 00:23:40,872 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:23:40,872 
- INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:23:40,879 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9451, LAS: 0.8962, UEM: 0.5269, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4271, partial_loss/deprel_loss: 0.4962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6752, loss: 0.7608, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 4%|4 | 4/95 [00:02<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9516, LAS: 0.9027, UEM: 0.6270, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1486, partial_loss/deprel_loss: 0.3714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7151, batch_reg_loss: 0.1929, reg_loss: 0.1928 ||: 7%|7 | 7/95 [00:05<01:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9464, LAS: 0.8968, UEM: 0.5877, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0149, partial_loss/deprel_loss: 0.8171, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0496, loss: 0.7587, batch_reg_loss: 0.1929, reg_loss: 0.1929 ||: 11%|# | 10/95 [00:07<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9475, LAS: 0.8987, UEM: 0.5835, LEM: 0.3159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.6744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.7560, batch_reg_loss: 0.1929, reg_loss: 0.1929 ||: 14%|#3 | 13/95 [00:09<00:58, 1.41it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9491, LAS: 0.9002, UEM: 0.5839, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.4450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.7433, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||: 17%|#6 | 16/95 [00:11<00:57, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9421, LAS: 0.8933, UEM: 0.5564, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2379, partial_loss/deprel_loss: 0.9064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1657, loss: 0.7891, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||: 20%|## | 19/95 [00:13<00:54, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9423, LAS: 0.8934, UEM: 0.5402, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7128, partial_loss/deprel_loss: 0.6937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8906, loss: 0.7904, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||: 23%|##3 | 22/95 [00:15<00:52, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8484, UAS: 0.9418, LAS: 0.8932, UEM: 0.5599, LEM: 0.2998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2771, partial_loss/deprel_loss: 0.8405, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1209, loss: 0.7862, batch_reg_loss: 0.1931, reg_loss: 0.1929 ||: 26%|##6 | 25/95 [00:18<00:50, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9440, LAS: 0.8952, UEM: 0.5799, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2042, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5741, loss: 0.7691, batch_reg_loss: 0.1931, reg_loss: 0.1930 ||: 29%|##9 | 28/95 [00:20<00:47, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.9391, LAS: 0.8896, UEM: 0.5604, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2063, partial_loss/deprel_loss: 0.8403, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1066, loss: 0.8119, batch_reg_loss: 0.1932, reg_loss: 0.1930 ||: 33%|###2 | 31/95 [00:22<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9401, LAS: 0.8910, UEM: 0.5682, LEM: 0.3108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4735, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.8022, batch_reg_loss: 0.1932, reg_loss: 0.1930 ||: 37%|###6 | 35/95 [00:24<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9409, LAS: 0.8918, UEM: 0.5754, LEM: 0.3143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5804, partial_loss/deprel_loss: 0.6790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8525, loss: 0.7963, batch_reg_loss: 0.1933, reg_loss: 0.1930 ||: 41%|####1 | 39/95 [00:27<00:36, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9411, LAS: 0.8918, UEM: 0.5984, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5573, partial_loss/deprel_loss: 0.6468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8222, loss: 0.7981, batch_reg_loss: 0.1933, reg_loss: 0.1931 ||: 45%|####5 | 43/95 [00:30<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9422, LAS: 0.8928, UEM: 0.5970, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2616, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 0.7911, batch_reg_loss: 0.1934, reg_loss: 0.1931 ||: 49%|####9 | 47/95 [00:32<00:30, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9429, LAS: 0.8933, UEM: 0.5970, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1733, partial_loss/deprel_loss: 0.3771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5298, loss: 0.7856, batch_reg_loss: 0.1934, reg_loss: 0.1931 ||: 55%|#####4 | 52/95 [00:34<00:25, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9439, LAS: 0.8947, UEM: 0.6059, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.6443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8198, loss: 0.7756, batch_reg_loss: 0.1935, reg_loss: 0.1931 ||: 59%|#####8 | 56/95 [00:37<00:24, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9433, LAS: 0.8941, UEM: 0.6199, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.5503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7207, loss: 0.7750, batch_reg_loss: 0.1935, reg_loss: 0.1932 ||: 63%|######3 | 60/95 [00:40<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9426, LAS: 0.8932, UEM: 0.6076, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6869, 
partial_loss/deprel_loss: 0.7540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9341, loss: 0.7818, batch_reg_loss: 0.1935, reg_loss: 0.1932 ||: 67%|######7 | 64/95 [00:42<00:19, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9431, LAS: 0.8937, UEM: 0.6083, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.7767, batch_reg_loss: 0.1936, reg_loss: 0.1932 ||: 72%|#######1 | 68/95 [00:44<00:16, 1.64it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9429, LAS: 0.8933, UEM: 0.6004, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6285, partial_loss/deprel_loss: 0.7207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8959, loss: 0.7792, batch_reg_loss: 0.1936, reg_loss: 0.1932 ||: 76%|#######5 | 72/95 [00:47<00:13, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9424, LAS: 0.8927, UEM: 0.5996, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.4595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6088, loss: 0.7833, batch_reg_loss: 0.1937, reg_loss: 0.1933 ||: 81%|########1 | 77/95 [00:49<00:10, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9417, LAS: 0.8918, UEM: 0.5899, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8107, partial_loss/deprel_loss: 0.7399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9478, loss: 0.7908, batch_reg_loss: 0.1938, reg_loss: 0.1933 ||: 
86%|########6 | 82/95 [00:51<00:06, 1.92it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9407, LAS: 0.8907, UEM: 0.5812, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9775, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8001, batch_reg_loss: 0.1938, reg_loss: 0.1933 ||: 91%|######### | 86/95 [00:54<00:05, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9400, LAS: 0.8900, UEM: 0.5715, LEM: 0.3336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4604, partial_loss/deprel_loss: 0.5352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.8060, batch_reg_loss: 0.1939, reg_loss: 0.1933 ||: 95%|#########4| 90/95 [00:57<00:03, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9401, LAS: 0.8903, UEM: 0.5700, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6862, loss: 0.8044, batch_reg_loss: 0.1939, reg_loss: 0.1934 ||: 99%|#########8| 94/95 [01:00<00:00, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9405, LAS: 0.8907, UEM: 0.5782, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1208, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4714, loss: 0.8009, batch_reg_loss: 0.1940, reg_loss: 0.1934 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer 
- patience | 4.000 | N/A\n", + "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - reg_loss | 0.193 | N/A\n", + "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UEM | 0.578 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LEM | 0.339 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.121 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UAS | 0.940 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.317 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LAS | 0.891 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:24:42,023 - INFO - 
combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:24:42,023 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:24:42,023 - INFO - combo.training.trainer - Epoch duration: 0:01:01.151488\n", + "2023-04-07 00:24:42,023 - INFO - combo.training.trainer - Estimated training time remaining: 5:52:25\n", + "2023-04-07 00:24:42,023 - INFO - allennlp.training.trainer - Epoch 85/399\n", + "2023-04-07 00:24:42,024 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:24:42,024 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:24:42,030 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9466, LAS: 0.8997, UEM: 0.4561, LEM: 0.2193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4473, partial_loss/deprel_loss: 0.5097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6912, loss: 0.7181, batch_reg_loss: 0.1940, reg_loss: 0.1940 ||: 3%|3 | 3/95 [00:02<01:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9368, LAS: 0.8882, UEM: 0.3619, LEM: 0.1613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6710, partial_loss/deprel_loss: 0.7099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.8291, batch_reg_loss: 0.1941, reg_loss: 0.1940 ||: 7%|7 | 7/95 [00:04<00:56, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9316, LAS: 0.8808, UEM: 0.3174, LEM: 0.1327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6454, partial_loss/deprel_loss: 0.6888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8743, loss: 0.8748, batch_reg_loss: 0.1941, 
reg_loss: 0.1940 ||: 11%|# | 10/95 [00:06<00:55, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9397, LAS: 0.8890, UEM: 0.4730, LEM: 0.2343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2931, partial_loss/deprel_loss: 0.4276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5948, loss: 0.8079, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 14%|#3 | 13/95 [00:08<00:54, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9408, LAS: 0.8907, UEM: 0.4914, LEM: 0.2435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3559, partial_loss/deprel_loss: 0.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6671, loss: 0.7967, batch_reg_loss: 0.1942, reg_loss: 0.1941 ||: 18%|#7 | 17/95 [00:10<00:49, 1.57it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9401, LAS: 0.8899, UEM: 0.4798, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4468, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6375, loss: 0.8073, batch_reg_loss: 0.1943, reg_loss: 0.1941 ||: 22%|##2 | 21/95 [00:13<00:46, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9404, LAS: 0.8903, UEM: 0.5016, LEM: 0.2535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2345, partial_loss/deprel_loss: 0.8768, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1426, loss: 0.8032, batch_reg_loss: 0.1943, reg_loss: 0.1941 ||: 25%|##5 | 24/95 [00:15<00:47, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, 
UAS: 0.9419, LAS: 0.8923, UEM: 0.5276, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3129, partial_loss/deprel_loss: 0.4355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6053, loss: 0.7858, batch_reg_loss: 0.1943, reg_loss: 0.1942 ||: 28%|##8 | 27/95 [00:17<00:48, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9422, LAS: 0.8923, UEM: 0.5250, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7323, partial_loss/deprel_loss: 0.6823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8867, loss: 0.7885, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||: 33%|###2 | 31/95 [00:20<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9423, LAS: 0.8925, UEM: 0.5366, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.3853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7862, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||: 36%|###5 | 34/95 [00:22<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9410, LAS: 0.8913, UEM: 0.5240, LEM: 0.2777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.5033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.7934, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||: 39%|###8 | 37/95 [00:25<00:42, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9421, LAS: 0.8924, UEM: 0.5291, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.4049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5757, loss: 0.7884, 
batch_reg_loss: 0.1945, reg_loss: 0.1942 ||: 43%|####3 | 41/95 [00:27<00:38, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9432, LAS: 0.8933, UEM: 0.5458, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8448, loss: 0.7791, batch_reg_loss: 0.1945, reg_loss: 0.1943 ||: 46%|####6 | 44/95 [00:29<00:36, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9433, LAS: 0.8932, UEM: 0.5358, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.5005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6861, loss: 0.7829, batch_reg_loss: 0.1945, reg_loss: 0.1943 ||: 51%|##### | 48/95 [00:32<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9437, LAS: 0.8938, UEM: 0.5471, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4086, partial_loss/deprel_loss: 0.5916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7496, loss: 0.7790, batch_reg_loss: 0.1946, reg_loss: 0.1943 ||: 54%|#####3 | 51/95 [00:34<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9440, LAS: 0.8945, UEM: 0.5814, LEM: 0.3416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0533, partial_loss/deprel_loss: 0.1731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3438, loss: 0.7741, batch_reg_loss: 0.1946, reg_loss: 0.1943 ||: 57%|#####6 | 54/95 [00:37<00:30, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9442, LAS: 0.8947, UEM: 
0.5798, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.5124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.7741, batch_reg_loss: 0.1947, reg_loss: 0.1943 ||: 61%|######1 | 58/95 [00:39<00:26, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8674, UAS: 0.9429, LAS: 0.8935, UEM: 0.5735, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8163, partial_loss/deprel_loss: 0.7422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9517, loss: 0.7821, batch_reg_loss: 0.1947, reg_loss: 0.1944 ||: 64%|######4 | 61/95 [00:41<00:23, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9431, LAS: 0.8936, UEM: 0.5759, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.5370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6902, loss: 0.7815, batch_reg_loss: 0.1947, reg_loss: 0.1944 ||: 67%|######7 | 64/95 [00:43<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9436, LAS: 0.8942, UEM: 0.5927, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.7782, batch_reg_loss: 0.1948, reg_loss: 0.1944 ||: 71%|####### | 67/95 [00:46<00:20, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9436, LAS: 0.8938, UEM: 0.5873, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5926, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8439, loss: 0.7793, batch_reg_loss: 
0.1948, reg_loss: 0.1944 ||: 75%|#######4 | 71/95 [00:48<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9439, LAS: 0.8939, UEM: 0.5835, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5846, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.7786, batch_reg_loss: 0.1948, reg_loss: 0.1944 ||: 79%|#######8 | 75/95 [00:51<00:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.9432, LAS: 0.8934, UEM: 0.5854, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7572, partial_loss/deprel_loss: 1.0228, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3645, loss: 0.7825, batch_reg_loss: 0.1949, reg_loss: 0.1944 ||: 82%|########2 | 78/95 [00:53<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9431, LAS: 0.8933, UEM: 0.5838, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9157, partial_loss/deprel_loss: 0.7864, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.7831, batch_reg_loss: 0.1949, reg_loss: 0.1945 ||: 85%|########5 | 81/95 [00:55<00:09, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9414, LAS: 0.8913, UEM: 0.5762, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8134, partial_loss/deprel_loss: 0.7467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9549, loss: 0.7976, batch_reg_loss: 0.1949, reg_loss: 0.1945 ||: 88%|########8 | 84/95 [00:57<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9408, LAS: 0.8907, UEM: 0.5804, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0394, partial_loss/deprel_loss: 1.1325, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5089, loss: 0.8013, batch_reg_loss: 0.1950, reg_loss: 0.1945 ||: 92%|#########1| 87/95 [00:59<00:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9410, LAS: 0.8907, UEM: 0.5769, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.8017, batch_reg_loss: 0.1950, reg_loss: 0.1945 ||: 96%|#########5| 91/95 [01:02<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9410, LAS: 0.8908, UEM: 0.5845, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.8013, batch_reg_loss: 0.1951, reg_loss: 0.1945 ||: 100%|##########| 95/95 [01:05<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9410, LAS: 0.8908, UEM: 0.5845, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.8013, batch_reg_loss: 0.1951, reg_loss: 0.1945 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-07 00:25:47,060 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9228, LAS: 0.8633, UEM: 0.3296, LEM: 0.0726, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8452, partial_loss/deprel_loss: 32.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 26.3538, loss: 34.2431, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9381, LAS: 0.8814, UEM: 0.5156, LEM: 0.2156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 26.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 21.1049, loss: 27.7967, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:04<00:04, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9497, LAS: 0.8967, UEM: 0.6925, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1871, partial_loss/deprel_loss: 21.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 16.9058, loss: 23.2656, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:07<00:00, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9474, LAS: 0.8946, UEM: 0.6749, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1030, partial_loss/deprel_loss: 45.7873, partial_loss/cycle_loss: 0.0000, batch_loss: 36.8505, loss: 24.5006, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.41it/s]\n", + "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - reg_loss | 0.195 | 0.000\n", + "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UEM | 0.585 | 0.675\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LEM | 0.344 | 0.398\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - EM | 0.916 | 0.874\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.355 | 1.103\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | 0.947\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.488 | 45.787\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - loss | 0.801 | 24.501\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LAS | 0.891 | 0.895\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:25:54,872 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:25:54,872 - INFO - 
combo.training.trainer - Epoch duration: 0:01:12.848706\n", + "2023-04-07 00:25:54,872 - INFO - combo.training.trainer - Estimated training time remaining: 5:51:38\n", + "2023-04-07 00:25:54,872 - INFO - allennlp.training.trainer - Epoch 86/399\n", + "2023-04-07 00:25:54,873 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:25:54,873 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:25:54,880 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9303, LAS: 0.8790, UEM: 0.5903, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2182, partial_loss/deprel_loss: 0.4540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.8753, batch_reg_loss: 0.1952, reg_loss: 0.1951 ||: 5%|5 | 5/95 [00:02<00:40, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9434, LAS: 0.8926, UEM: 0.6223, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2440, partial_loss/deprel_loss: 0.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.7749, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||: 9%|9 | 9/95 [00:04<00:40, 2.10it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9415, LAS: 0.8907, UEM: 0.6017, LEM: 0.3346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9514, partial_loss/deprel_loss: 0.7318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9710, loss: 0.7896, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||: 13%|#2 | 12/95 [00:06<00:45, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9411, LAS: 0.8912, UEM: 0.5743, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3750, partial_loss/deprel_loss: 0.4740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.7949, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||: 17%|#6 | 16/95 [00:09<00:46, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9423, LAS: 0.8922, UEM: 0.5722, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4842, partial_loss/deprel_loss: 0.5115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7014, loss: 0.7872, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||: 20%|## | 19/95 [00:11<00:47, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9438, LAS: 0.8937, UEM: 0.5861, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3016, partial_loss/deprel_loss: 0.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6089, loss: 0.7726, batch_reg_loss: 0.1954, reg_loss: 0.1952 ||: 23%|##3 | 22/95 [00:14<00:52, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9440, LAS: 0.8947, UEM: 0.5654, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6113, partial_loss/deprel_loss: 0.6593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8451, loss: 0.7651, batch_reg_loss: 0.1954, reg_loss: 0.1953 ||: 27%|##7 | 26/95 [00:16<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9401, LAS: 0.8902, UEM: 0.5559, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3724, partial_loss/deprel_loss: 0.9640, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.2411, loss: 0.8040, batch_reg_loss: 0.1954, reg_loss: 0.1953 ||: 31%|### | 29/95 [00:18<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9427, LAS: 0.8938, UEM: 0.6186, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4439, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.7770, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||: 34%|###3 | 32/95 [00:21<00:48, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9427, LAS: 0.8938, UEM: 0.6178, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5841, loss: 0.7726, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||: 37%|###6 | 35/95 [00:23<00:44, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9427, LAS: 0.8938, UEM: 0.6098, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7651, partial_loss/deprel_loss: 0.7290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9318, loss: 0.7718, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||: 40%|#### | 38/95 [00:25<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9435, LAS: 0.8944, UEM: 0.6106, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7390, partial_loss/deprel_loss: 0.7182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9179, loss: 0.7679, batch_reg_loss: 0.1956, reg_loss: 0.1954 ||: 43%|####3 | 41/95 [00:28<00:39, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 
0.9429, LAS: 0.8935, UEM: 0.5934, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7213, partial_loss/deprel_loss: 0.7034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9026, loss: 0.7772, batch_reg_loss: 0.1956, reg_loss: 0.1954 ||: 47%|####7 | 45/95 [00:30<00:35, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9216, UAS: 0.9438, LAS: 0.8945, UEM: 0.5972, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.7687, batch_reg_loss: 0.1957, reg_loss: 0.1954 ||: 51%|##### | 48/95 [00:32<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9421, LAS: 0.8928, UEM: 0.5813, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5677, partial_loss/deprel_loss: 0.6120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.7809, batch_reg_loss: 0.1957, reg_loss: 0.1954 ||: 55%|#####4 | 52/95 [00:35<00:29, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8515, UAS: 0.9420, LAS: 0.8925, UEM: 0.5764, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9556, partial_loss/deprel_loss: 0.8274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0488, loss: 0.7859, batch_reg_loss: 0.1958, reg_loss: 0.1954 ||: 59%|#####8 | 56/95 [00:37<00:26, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9419, LAS: 0.8923, UEM: 0.5689, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6214, partial_loss/deprel_loss: 0.6430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8345, loss: 
0.7897, batch_reg_loss: 0.1958, reg_loss: 0.1955 ||: 63%|######3 | 60/95 [00:40<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9411, LAS: 0.8915, UEM: 0.5695, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1562, partial_loss/deprel_loss: 0.3311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4920, loss: 0.7975, batch_reg_loss: 0.1959, reg_loss: 0.1955 ||: 66%|######6 | 63/95 [00:42<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9412, LAS: 0.8916, UEM: 0.5788, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.7970, batch_reg_loss: 0.1959, reg_loss: 0.1955 ||: 69%|######9 | 66/95 [00:44<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9420, LAS: 0.8924, UEM: 0.5859, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.4007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.7910, batch_reg_loss: 0.1960, reg_loss: 0.1955 ||: 74%|#######3 | 70/95 [00:47<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9424, LAS: 0.8926, UEM: 0.5855, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6856, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8531, loss: 0.7894, batch_reg_loss: 0.1960, reg_loss: 0.1955 ||: 77%|#######6 | 73/95 [00:49<00:15, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9419, LAS: 0.8921, UEM: 0.5873, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.7939, batch_reg_loss: 0.1960, reg_loss: 0.1956 ||: 80%|######## | 76/95 [00:51<00:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9419, LAS: 0.8920, UEM: 0.5851, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.9078, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1329, loss: 0.7961, batch_reg_loss: 0.1961, reg_loss: 0.1956 ||: 84%|########4 | 80/95 [00:54<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9415, LAS: 0.8915, UEM: 0.5799, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8618, partial_loss/deprel_loss: 0.7938, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0035, loss: 0.8000, batch_reg_loss: 0.1961, reg_loss: 0.1956 ||: 87%|########7 | 83/95 [00:56<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9413, LAS: 0.8911, UEM: 0.5741, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8762, partial_loss/deprel_loss: 0.7787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9944, loss: 0.8044, batch_reg_loss: 0.1962, reg_loss: 0.1956 ||: 92%|#########1| 87/95 [00:58<00:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9415, LAS: 0.8913, UEM: 0.5878, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4850, 
partial_loss/deprel_loss: 0.5832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7597, loss: 0.8039, batch_reg_loss: 0.1962, reg_loss: 0.1957 ||: 96%|#########5| 91/95 [01:02<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9417, LAS: 0.8914, UEM: 0.5839, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4754, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8023, batch_reg_loss: 0.1963, reg_loss: 0.1957 ||: 100%|##########| 95/95 [01:04<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9417, LAS: 0.8914, UEM: 0.5839, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4754, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8023, batch_reg_loss: 0.1963, reg_loss: 0.1957 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - reg_loss | 0.196 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - LEM | 0.344 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EM | 0.893 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.475 | N/A\n", + "2023-04-07 00:26:59,579 - 
INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.564 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - LAS | 0.891 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:26:59,581 - INFO - combo.training.trainer - Epoch duration: 0:01:04.708363\n", + "2023-04-07 00:26:59,581 - INFO - combo.training.trainer - Estimated training time remaining: 5:50:22\n", + "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - Epoch 87/399\n", + "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:26:59,588 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9615, LAS: 0.9135, UEM: 0.6192, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3482, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.6525, batch_reg_loss: 0.1963, reg_loss: 0.1963 ||: 4%|4 | 4/95 [00:02<00:49, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9525, LAS: 0.9039, UEM: 0.5553, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6272, loss: 0.7114, batch_reg_loss: 0.1963, reg_loss: 0.1963 ||: 7%|7 | 7/95 [00:04<00:53, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9434, LAS: 0.8928, UEM: 0.5168, LEM: 0.2456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3595, partial_loss/deprel_loss: 0.9489, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2274, loss: 0.7922, batch_reg_loss: 0.1964, reg_loss: 0.1963 ||: 11%|# | 10/95 [00:06<00:53, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9357, LAS: 0.8853, UEM: 0.5261, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5121, loss: 0.8409, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 15%|#4 | 14/95 [00:09<00:51, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9392, LAS: 0.8890, UEM: 0.5406, LEM: 0.2792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, 
partial_loss/deprel_loss: 0.4373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.8206, batch_reg_loss: 0.1965, reg_loss: 0.1964 ||: 19%|#8 | 18/95 [00:11<00:49, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9399, LAS: 0.8901, UEM: 0.5422, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4526, partial_loss/deprel_loss: 0.5380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7175, loss: 0.8118, batch_reg_loss: 0.1965, reg_loss: 0.1964 ||: 22%|##2 | 21/95 [00:13<00:48, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9409, LAS: 0.8908, UEM: 0.5386, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2947, partial_loss/deprel_loss: 0.4101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.8113, batch_reg_loss: 0.1966, reg_loss: 0.1964 ||: 26%|##6 | 25/95 [00:16<00:44, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9423, LAS: 0.8922, UEM: 0.5240, LEM: 0.2676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5496, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8237, loss: 0.8047, batch_reg_loss: 0.1966, reg_loss: 0.1965 ||: 32%|###1 | 30/95 [00:18<00:37, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9406, LAS: 0.8905, UEM: 0.5147, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5974, partial_loss/deprel_loss: 0.6037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 0.8168, batch_reg_loss: 0.1967, reg_loss: 0.1965 ||: 37%|###6 | 35/95 
[00:20<00:32, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9417, LAS: 0.8920, UEM: 0.5224, LEM: 0.2722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3679, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6711, loss: 0.8073, batch_reg_loss: 0.1968, reg_loss: 0.1965 ||: 42%|####2 | 40/95 [00:23<00:28, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9440, LAS: 0.8946, UEM: 0.5725, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4801, loss: 0.7860, batch_reg_loss: 0.1968, reg_loss: 0.1965 ||: 46%|####6 | 44/95 [00:25<00:26, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9447, LAS: 0.8956, UEM: 0.5881, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5514, loss: 0.7778, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||: 51%|##### | 48/95 [00:28<00:28, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9442, LAS: 0.8951, UEM: 0.5793, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5449, loss: 0.7808, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||: 55%|#####4 | 52/95 [00:31<00:26, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9433, LAS: 0.8942, UEM: 0.5829, LEM: 0.3378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.6835, partial_loss/deprel_loss: 1.0484, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3723, loss: 0.7876, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9443, LAS: 0.8949, UEM: 0.5903, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.4897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.7808, batch_reg_loss: 0.1970, reg_loss: 0.1966 ||: 63%|######3 | 60/95 [00:37<00:25, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9443, LAS: 0.8949, UEM: 0.5840, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3851, partial_loss/deprel_loss: 0.5246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6937, loss: 0.7806, batch_reg_loss: 0.1970, reg_loss: 0.1967 ||: 67%|######7 | 64/95 [00:40<00:22, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9443, LAS: 0.8950, UEM: 0.5846, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.7800, batch_reg_loss: 0.1971, reg_loss: 0.1967 ||: 72%|#######1 | 68/95 [00:42<00:18, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9439, LAS: 0.8946, UEM: 0.5818, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0211, partial_loss/deprel_loss: 0.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.7833, batch_reg_loss: 0.1971, reg_loss: 0.1967 ||: 75%|#######4 | 71/95 [00:45<00:16, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8461, UAS: 0.9427, LAS: 0.8933, UEM: 0.5758, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2804, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1329, loss: 0.7921, batch_reg_loss: 0.1972, reg_loss: 0.1967 ||: 79%|#######8 | 75/95 [00:47<00:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9426, LAS: 0.8932, UEM: 0.5802, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3690, partial_loss/deprel_loss: 0.8747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1707, loss: 0.7923, batch_reg_loss: 0.1972, reg_loss: 0.1967 ||: 82%|########2 | 78/95 [00:49<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9424, LAS: 0.8930, UEM: 0.5744, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6648, partial_loss/deprel_loss: 0.6441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8455, loss: 0.7947, batch_reg_loss: 0.1972, reg_loss: 0.1968 ||: 85%|########5 | 81/95 [00:51<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9427, LAS: 0.8933, UEM: 0.5824, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3121, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6493, loss: 0.7919, batch_reg_loss: 0.1973, reg_loss: 0.1968 ||: 88%|########8 | 84/95 [00:54<00:08, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9424, LAS: 0.8929, UEM: 0.5754, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.8627, partial_loss/deprel_loss: 0.8393, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0413, loss: 0.7959, batch_reg_loss: 0.1973, reg_loss: 0.1968 ||: 92%|#########1| 87/95 [00:56<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9418, LAS: 0.8922, UEM: 0.5728, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8800, partial_loss/deprel_loss: 0.7644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9849, loss: 0.8008, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||: 96%|#########5| 91/95 [00:58<00:02, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9425, LAS: 0.8930, UEM: 0.5869, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0619, partial_loss/deprel_loss: 0.1758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7957, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||: 100%|##########| 95/95 [01:01<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9425, LAS: 0.8930, UEM: 0.5869, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0619, partial_loss/deprel_loss: 0.1758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7957, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - reg_loss | 0.197 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UEM | 0.587 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - LEM | 0.347 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - EM | 0.951 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.062 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.176 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - loss | 0.796 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - LAS | 0.893 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:01,205 - 
INFO - combo.training.trainer - Epoch duration: 0:01:01.623636\n", + "2023-04-07 00:28:01,205 - INFO - combo.training.trainer - Estimated training time remaining: 5:48:55\n", + "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - Epoch 88/399\n", + "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:28:01,211 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9353, LAS: 0.8842, UEM: 0.4656, LEM: 0.2133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9636, partial_loss/deprel_loss: 0.8324, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0561, loss: 0.8300, batch_reg_loss: 0.1975, reg_loss: 0.1975 ||: 3%|3 | 3/95 [00:02<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9345, LAS: 0.8837, UEM: 0.4115, LEM: 0.1826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3071, partial_loss/deprel_loss: 0.8828, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1652, loss: 0.8505, batch_reg_loss: 0.1975, reg_loss: 0.1975 ||: 7%|7 | 7/95 [00:04<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9450, LAS: 0.8953, UEM: 0.5579, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3981, partial_loss/deprel_loss: 0.4900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7676, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||: 11%|# | 10/95 [00:06<01:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9481, LAS: 0.8994, 
UEM: 0.5789, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.4957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.7347, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||: 14%|#3 | 13/95 [00:09<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9512, LAS: 0.9047, UEM: 0.6611, LEM: 0.4402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6081, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8793, loss: 0.7090, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||: 17%|#6 | 16/95 [00:11<01:00, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9520, LAS: 0.9051, UEM: 0.6520, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3609, partial_loss/deprel_loss: 0.4233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.7045, batch_reg_loss: 0.1976, reg_loss: 0.1976 ||: 20%|## | 19/95 [00:13<00:58, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9511, LAS: 0.9039, UEM: 0.6374, LEM: 0.4072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2298, partial_loss/deprel_loss: 0.3898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.7115, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||: 24%|##4 | 23/95 [00:16<00:54, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9472, LAS: 0.8994, UEM: 0.6104, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0077, partial_loss/deprel_loss: 0.8336, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0661, loss: 0.7468, batch_reg_loss: 0.1977, 
reg_loss: 0.1976 ||: 28%|##8 | 27/95 [00:19<00:49, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9473, LAS: 0.8991, UEM: 0.6025, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8486, loss: 0.7498, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||: 33%|###2 | 31/95 [00:22<00:44, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9438, LAS: 0.8954, UEM: 0.5855, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9936, partial_loss/deprel_loss: 0.9843, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3839, loss: 0.7738, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||: 36%|###5 | 34/95 [00:24<00:43, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9240, UAS: 0.9449, LAS: 0.8968, UEM: 0.5936, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2525, partial_loss/deprel_loss: 0.3521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.7618, batch_reg_loss: 0.1978, reg_loss: 0.1976 ||: 39%|###8 | 37/95 [00:26<00:42, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8425, UAS: 0.9435, LAS: 0.8951, UEM: 0.5877, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2622, partial_loss/deprel_loss: 0.9161, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1831, loss: 0.7751, batch_reg_loss: 0.1978, reg_loss: 0.1976 ||: 42%|####2 | 40/95 [00:28<00:40, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8918, UAS: 0.9431, LAS: 0.8944, UEM: 0.5807, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4448, partial_loss/deprel_loss: 0.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7923, loss: 0.7778, batch_reg_loss: 0.1978, reg_loss: 0.1977 ||: 45%|####5 | 43/95 [00:31<00:39, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9427, LAS: 0.8940, UEM: 0.5724, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7533, partial_loss/deprel_loss: 0.6934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9033, loss: 0.7822, batch_reg_loss: 0.1979, reg_loss: 0.1977 ||: 49%|####9 | 47/95 [00:33<00:34, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9435, LAS: 0.8949, UEM: 0.5817, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2394, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.7740, batch_reg_loss: 0.1979, reg_loss: 0.1977 ||: 53%|#####2 | 50/95 [00:36<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9415, LAS: 0.8927, UEM: 0.5700, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4372, partial_loss/deprel_loss: 1.0914, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3585, loss: 0.7914, batch_reg_loss: 0.1980, reg_loss: 0.1977 ||: 56%|#####5 | 53/95 [00:38<00:30, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9413, LAS: 0.8922, UEM: 0.5691, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.5933, loss: 0.7934, batch_reg_loss: 0.1980, reg_loss: 0.1977 ||: 59%|#####8 | 56/95 [00:40<00:28, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9411, LAS: 0.8918, UEM: 0.5593, LEM: 0.3255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8201, partial_loss/deprel_loss: 0.6674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8960, loss: 0.7948, batch_reg_loss: 0.1981, reg_loss: 0.1977 ||: 64%|######4 | 61/95 [00:42<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9403, LAS: 0.8908, UEM: 0.5581, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1353, partial_loss/deprel_loss: 0.3320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 0.8029, batch_reg_loss: 0.1981, reg_loss: 0.1978 ||: 69%|######9 | 66/95 [00:45<00:17, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.9406, LAS: 0.8907, UEM: 0.5623, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0894, partial_loss/deprel_loss: 0.9622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1858, loss: 0.8026, batch_reg_loss: 0.1982, reg_loss: 0.1978 ||: 75%|#######4 | 71/95 [00:47<00:13, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9408, LAS: 0.8909, UEM: 0.5787, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1041, partial_loss/deprel_loss: 0.2437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4141, loss: 0.8013, batch_reg_loss: 0.1983, reg_loss: 0.1978 ||: 80%|######## | 76/95 [00:50<00:10, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, 
UAS: 0.9404, LAS: 0.8905, UEM: 0.5721, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6706, partial_loss/deprel_loss: 0.6264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.8033, batch_reg_loss: 0.1983, reg_loss: 0.1979 ||: 84%|########4 | 80/95 [00:52<00:08, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9411, LAS: 0.8912, UEM: 0.5771, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.5852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7394, loss: 0.7981, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||: 88%|########8 | 84/95 [00:55<00:06, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9412, LAS: 0.8912, UEM: 0.5732, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4024, partial_loss/deprel_loss: 0.5715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8009, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||: 93%|#########2| 88/95 [00:58<00:04, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9422, LAS: 0.8921, UEM: 0.5884, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1376, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4839, loss: 0.7930, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||: 97%|#########6| 92/95 [01:00<00:01, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9420, LAS: 0.8917, UEM: 0.5827, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6680, partial_loss/deprel_loss: 0.7358, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.9207, loss: 0.7973, batch_reg_loss: 0.1985, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:29:04,015 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - reg_loss | 0.198 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - LEM | 0.345 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EM | 0.884 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.668 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.736 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - loss | 0.797 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer 
- ELAS | 0.000 | N/A\n", + "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:29:04,017 - INFO - combo.training.trainer - Epoch duration: 0:01:02.812578\n", + "2023-04-07 00:29:04,018 - INFO - combo.training.trainer - Estimated training time remaining: 5:47:33\n", + "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - Epoch 89/399\n", + "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:29:04,025 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9481, LAS: 0.9035, UEM: 0.4851, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5204, partial_loss/deprel_loss: 0.5339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7297, loss: 0.7150, batch_reg_loss: 0.1985, reg_loss: 0.1985 ||: 3%|3 | 3/95 [00:02<01:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9456, LAS: 0.8989, UEM: 0.4396, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4658, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.7531, batch_reg_loss: 0.1985, reg_loss: 0.1985 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9442, LAS: 0.8966, UEM: 0.4105, LEM: 0.1650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7382, partial_loss/deprel_loss: 0.7128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9165, loss: 0.7817, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||: 11%|# | 10/95 [00:06<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9434, LAS: 0.8962, UEM: 0.4338, LEM: 0.1837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5118, partial_loss/deprel_loss: 0.5192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7163, loss: 0.7785, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||: 14%|#3 | 13/95 [00:08<00:56, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9447, LAS: 0.8973, UEM: 0.4778, LEM: 0.2194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.4379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6080, loss: 0.7694, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||: 17%|#6 | 16/95 [00:11<00:56, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9442, LAS: 0.8967, UEM: 0.5127, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4065, partial_loss/deprel_loss: 0.4926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.7751, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||: 20%|## | 19/95 [00:13<00:55, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9470, LAS: 0.8991, UEM: 0.5595, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4643, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6297, loss: 0.7508, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||: 23%|##3 | 22/95 [00:16<00:55, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9477, LAS: 0.8998, UEM: 0.5598, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6401, partial_loss/deprel_loss: 0.6176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8208, loss: 0.7474, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||: 26%|##6 | 25/95 [00:18<00:51, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9437, LAS: 0.8956, UEM: 0.5304, LEM: 0.2771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4528, partial_loss/deprel_loss: 0.5562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7343, loss: 0.7814, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||: 31%|### | 29/95 [00:20<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8773, UAS: 0.9447, LAS: 0.8961, UEM: 0.5438, LEM: 0.2865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6302, partial_loss/deprel_loss: 0.6282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8274, loss: 0.7733, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||: 34%|###3 | 32/95 [00:23<00:46, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9434, LAS: 0.8946, UEM: 0.5375, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5787, partial_loss/deprel_loss: 0.6191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8098, loss: 0.7841, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||: 38%|###7 | 36/95 [00:25<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9428, LAS: 0.8936, UEM: 0.5350, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.7361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9075, loss: 0.7898, batch_reg_loss: 0.1989, reg_loss: 0.1987 ||: 42%|####2 | 40/95 [00:28<00:38, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9414, LAS: 0.8919, UEM: 0.5269, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9567, partial_loss/deprel_loss: 0.8349, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0581, loss: 0.8030, batch_reg_loss: 0.1989, reg_loss: 0.1987 ||: 46%|####6 | 44/95 [00:31<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9420, LAS: 0.8931, UEM: 0.5699, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2347, partial_loss/deprel_loss: 0.3596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5336, loss: 0.7941, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||: 49%|####9 | 47/95 [00:33<00:35, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9396, LAS: 0.8906, UEM: 0.5562, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0159, partial_loss/deprel_loss: 0.8514, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0833, loss: 0.8123, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||: 53%|#####2 | 50/95 [00:35<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8634, UAS: 0.9394, LAS: 0.8902, UEM: 0.5621, LEM: 0.3331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9020, partial_loss/deprel_loss: 0.7869, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.0089, loss: 0.8138, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||: 56%|#####5 | 53/95 [00:37<00:30, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9405, LAS: 0.8913, UEM: 0.5770, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1214, partial_loss/deprel_loss: 0.2771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.8053, batch_reg_loss: 0.1991, reg_loss: 0.1988 ||: 59%|#####8 | 56/95 [00:40<00:29, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9407, LAS: 0.8914, UEM: 0.5740, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.8043, batch_reg_loss: 0.1991, reg_loss: 0.1988 ||: 62%|######2 | 59/95 [00:42<00:26, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9388, LAS: 0.8892, UEM: 0.5662, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3096, partial_loss/deprel_loss: 0.8764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1622, loss: 0.8187, batch_reg_loss: 0.1992, reg_loss: 0.1988 ||: 65%|######5 | 62/95 [00:44<00:23, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9393, LAS: 0.8896, UEM: 0.5640, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.5068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6617, loss: 0.8159, batch_reg_loss: 0.1992, reg_loss: 0.1988 ||: 69%|######9 | 66/95 [00:46<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9396, LAS: 0.8899, UEM: 0.5684, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2685, partial_loss/deprel_loss: 0.3919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5665, loss: 0.8126, batch_reg_loss: 0.1993, reg_loss: 0.1988 ||: 74%|#######3 | 70/95 [00:49<00:16, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9406, LAS: 0.8911, UEM: 0.5816, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5669, partial_loss/deprel_loss: 0.6554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8370, loss: 0.8050, batch_reg_loss: 0.1993, reg_loss: 0.1989 ||: 78%|#######7 | 74/95 [00:52<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9397, LAS: 0.8902, UEM: 0.5767, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4900, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7292, loss: 0.8124, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||: 81%|########1 | 77/95 [00:54<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9408, LAS: 0.8914, UEM: 0.5873, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2311, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.8032, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||: 84%|########4 | 80/95 [00:56<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9411, LAS: 0.8917, UEM: 0.5851, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3257, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.8013, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||: 87%|########7 | 83/95 [00:58<00:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9405, LAS: 0.8909, UEM: 0.5781, LEM: 0.3464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0019, partial_loss/deprel_loss: 0.7952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.8081, batch_reg_loss: 0.1995, reg_loss: 0.1989 ||: 92%|#########1| 87/95 [01:01<00:05, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9401, LAS: 0.8905, UEM: 0.5735, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8329, loss: 0.8110, batch_reg_loss: 0.1995, reg_loss: 0.1990 ||: 95%|#########4| 90/95 [01:03<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9411, LAS: 0.8917, UEM: 0.5826, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8023, batch_reg_loss: 0.1996, reg_loss: 0.1990 ||: 100%|##########| 95/95 [01:05<00:00, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9411, LAS: 0.8917, UEM: 0.5826, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8023, batch_reg_loss: 0.1996, reg_loss: 0.1990 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-07 
00:30:09,657 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - reg_loss | 0.199 | N/A\n", + "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LEM | 0.351 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - EM | 0.914 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.242 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.421 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + 
"2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:09,659 - INFO - combo.training.trainer - Epoch duration: 0:01:05.641583\n", + "2023-04-07 00:30:09,659 - INFO - combo.training.trainer - Estimated training time remaining: 5:46:21\n", + "2023-04-07 00:30:09,659 - INFO - allennlp.training.trainer - Epoch 90/399\n", + "2023-04-07 00:30:09,660 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:30:09,660 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:30:09,667 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9450, LAS: 0.8936, UEM: 0.5123, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7253, partial_loss/deprel_loss: 0.6645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.7937, batch_reg_loss: 0.1996, reg_loss: 0.1996 ||: 5%|5 | 5/95 [00:02<00:42, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9427, LAS: 0.8942, UEM: 0.5429, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4502, partial_loss/deprel_loss: 0.4530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6521, loss: 0.7870, batch_reg_loss: 0.1997, reg_loss: 0.1996 ||: 11%|# | 10/95 [00:04<00:39, 2.14it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9460, LAS: 0.8988, UEM: 0.5889, LEM: 0.3498, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5685, loss: 0.7484, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||: 15%|#4 | 14/95 [00:07<00:41, 1.96it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9508, LAS: 0.9035, UEM: 0.6386, LEM: 0.3827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.3739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.7130, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||: 19%|#8 | 18/95 [00:09<00:43, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9519, LAS: 0.9046, UEM: 0.6384, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2246, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5487, loss: 0.7054, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||: 22%|##2 | 21/95 [00:12<00:47, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9489, LAS: 0.9007, UEM: 0.6122, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0449, partial_loss/deprel_loss: 0.8457, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0853, loss: 0.7370, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||: 25%|##5 | 24/95 [00:14<00:46, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9482, LAS: 0.8997, UEM: 0.6132, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0205, partial_loss/deprel_loss: 0.8360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0728, loss: 0.7427, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||: 29%|##9 | 28/95 
[00:16<00:43, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9476, LAS: 0.8990, UEM: 0.5980, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3960, partial_loss/deprel_loss: 0.4589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.7487, batch_reg_loss: 0.1999, reg_loss: 0.1997 ||: 33%|###2 | 31/95 [00:18<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9457, LAS: 0.8969, UEM: 0.5970, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6791, loss: 0.7626, batch_reg_loss: 0.1999, reg_loss: 0.1998 ||: 36%|###5 | 34/95 [00:21<00:41, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9449, LAS: 0.8961, UEM: 0.5941, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.4196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.7677, batch_reg_loss: 0.1999, reg_loss: 0.1998 ||: 40%|#### | 38/95 [00:23<00:38, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9417, LAS: 0.8924, UEM: 0.5785, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9151, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9727, loss: 0.7963, batch_reg_loss: 0.2000, reg_loss: 0.1998 ||: 43%|####3 | 41/95 [00:25<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9403, LAS: 0.8911, UEM: 0.5619, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 1.1120, partial_loss/deprel_loss: 0.7932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0570, loss: 0.8087, batch_reg_loss: 0.2000, reg_loss: 0.1998 ||: 47%|####7 | 45/95 [00:28<00:32, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9415, LAS: 0.8924, UEM: 0.5658, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3023, partial_loss/deprel_loss: 0.5293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6840, loss: 0.7983, batch_reg_loss: 0.2001, reg_loss: 0.1998 ||: 52%|#####1 | 49/95 [00:30<00:29, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9432, LAS: 0.8943, UEM: 0.5872, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1945, partial_loss/deprel_loss: 0.2997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4789, loss: 0.7849, batch_reg_loss: 0.2002, reg_loss: 0.1999 ||: 56%|#####5 | 53/95 [00:33<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.9423, LAS: 0.8932, UEM: 0.5780, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2293, partial_loss/deprel_loss: 0.9079, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1724, loss: 0.7951, batch_reg_loss: 0.2002, reg_loss: 0.1999 ||: 60%|###### | 57/95 [00:36<00:25, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9628, UAS: 0.9417, LAS: 0.8928, UEM: 0.5927, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0499, partial_loss/deprel_loss: 0.1731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.7994, batch_reg_loss: 0.2003, reg_loss: 0.1999 ||: 64%|######4 | 61/95 [00:39<00:23, 
1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9412, LAS: 0.8921, UEM: 0.5921, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2756, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6002, loss: 0.8031, batch_reg_loss: 0.2003, reg_loss: 0.1999 ||: 67%|######7 | 64/95 [00:42<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9423, LAS: 0.8931, UEM: 0.6025, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3239, partial_loss/deprel_loss: 0.5025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6671, loss: 0.7938, batch_reg_loss: 0.2004, reg_loss: 0.1999 ||: 71%|####### | 67/95 [00:44<00:21, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9422, LAS: 0.8929, UEM: 0.6057, LEM: 0.3713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5660, partial_loss/deprel_loss: 0.5883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7842, loss: 0.7939, batch_reg_loss: 0.2004, reg_loss: 0.2000 ||: 74%|#######3 | 70/95 [00:46<00:19, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9420, LAS: 0.8928, UEM: 0.6053, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.4256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.7944, batch_reg_loss: 0.2004, reg_loss: 0.2000 ||: 77%|#######6 | 73/95 [00:48<00:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9422, LAS: 0.8928, UEM: 0.5995, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.7004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.7949, batch_reg_loss: 0.2005, reg_loss: 0.2000 ||: 80%|######## | 76/95 [00:50<00:13, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9424, LAS: 0.8932, UEM: 0.6052, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0929, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4069, loss: 0.7926, batch_reg_loss: 0.2005, reg_loss: 0.2000 ||: 83%|########3 | 79/95 [00:53<00:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9423, LAS: 0.8931, UEM: 0.5989, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6515, partial_loss/deprel_loss: 0.8085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9777, loss: 0.7942, batch_reg_loss: 0.2006, reg_loss: 0.2000 ||: 87%|########7 | 83/95 [00:55<00:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9423, LAS: 0.8929, UEM: 0.5913, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8163, partial_loss/deprel_loss: 0.6959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9206, loss: 0.7933, batch_reg_loss: 0.2006, reg_loss: 0.2001 ||: 92%|#########1| 87/95 [00:58<00:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9423, LAS: 0.8929, UEM: 0.5877, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6205, loss: 0.7947, 
batch_reg_loss: 0.2006, reg_loss: 0.2001 ||: 96%|#########5| 91/95 [01:00<00:02, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9417, LAS: 0.8922, UEM: 0.5804, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.8000, batch_reg_loss: 0.2007, reg_loss: 0.2001 ||: 100%|##########| 95/95 [01:03<00:00, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9417, LAS: 0.8922, UEM: 0.5804, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.8000, batch_reg_loss: 0.2007, reg_loss: 0.2001 ||: 100%|##########| 95/95 [01:03<00:00, 1.51it/s]\n", + "2023-04-07 00:31:12,789 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9410, LAS: 0.8857, UEM: 0.4621, LEM: 0.1514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 31.5549, partial_loss/cycle_loss: 0.0000, batch_loss: 25.4141, loss: 21.2894, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9450, LAS: 0.8936, UEM: 0.6514, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1134, partial_loss/deprel_loss: 43.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 35.0502, loss: 21.7831, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.06it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9368, LAS: 0.8826, UEM: 0.5799, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5046, partial_loss/deprel_loss: 49.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 39.8689, loss: 25.7462, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9441, LAS: 0.8900, UEM: 0.6513, LEM: 0.3949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4922, partial_loss/deprel_loss: 26.0854, partial_loss/cycle_loss: 0.0000, batch_loss: 20.9668, loss: 24.0852, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:09<00:02, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9477, LAS: 0.8952, UEM: 0.6692, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3859, partial_loss/deprel_loss: 21.0911, partial_loss/cycle_loss: 0.0000, batch_loss: 16.9501, loss: 23.0576, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00, 1.00s/it]\n", + "2023-04-07 00:31:23,825 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - reg_loss | 0.200 | 0.000\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UEM | 0.580 | 0.669\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - LEM | 0.347 
| 0.406\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EM | 0.897 | 0.918\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.473 | 0.386\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | 0.948\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.581 | 21.091\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - loss | 0.800 | 23.058\n", + "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | 0.895\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:23,828 - INFO - combo.training.trainer - Epoch duration: 0:01:14.168224\n", + "2023-04-07 00:31:23,828 - INFO - combo.training.trainer - Estimated training time remaining: 5:45:39\n", + "2023-04-07 00:31:23,828 - INFO - allennlp.training.trainer - Epoch 91/399\n", + "2023-04-07 00:31:23,828 - INFO - 
allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:31:23,828 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:31:23,836 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9371, LAS: 0.8873, UEM: 0.5567, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2762, partial_loss/deprel_loss: 0.9301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2001, loss: 0.8243, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||: 4%|4 | 4/95 [00:02<00:57, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9257, LAS: 0.8748, UEM: 0.4554, LEM: 0.2406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5300, partial_loss/deprel_loss: 0.5716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.9286, batch_reg_loss: 0.2008, reg_loss: 0.2007 ||: 7%|7 | 7/95 [00:04<00:56, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9312, LAS: 0.8795, UEM: 0.4493, LEM: 0.2157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4770, partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.9050, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||: 12%|#1 | 11/95 [00:07<00:53, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9337, LAS: 0.8820, UEM: 0.4745, LEM: 0.2472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9149, partial_loss/deprel_loss: 0.8923, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0978, loss: 0.8786, 
batch_reg_loss: 0.2009, reg_loss: 0.2008 ||: 17%|#6 | 16/95 [00:09<00:46, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9357, LAS: 0.8855, UEM: 0.5141, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1272, partial_loss/deprel_loss: 0.2702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4426, loss: 0.8593, batch_reg_loss: 0.2010, reg_loss: 0.2008 ||: 22%|##2 | 21/95 [00:11<00:41, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9367, LAS: 0.8866, UEM: 0.5174, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0210, partial_loss/deprel_loss: 0.8528, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0875, loss: 0.8502, batch_reg_loss: 0.2011, reg_loss: 0.2009 ||: 26%|##6 | 25/95 [00:14<00:42, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9350, LAS: 0.8844, UEM: 0.4910, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9201, partial_loss/deprel_loss: 0.8418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0586, loss: 0.8664, batch_reg_loss: 0.2011, reg_loss: 0.2009 ||: 31%|### | 29/95 [00:16<00:39, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9362, LAS: 0.8850, UEM: 0.5022, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5716, partial_loss/deprel_loss: 0.6732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.8630, batch_reg_loss: 0.2012, reg_loss: 0.2009 ||: 35%|###4 | 33/95 [00:19<00:36, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9373, LAS: 0.8861, UEM: 0.4997, LEM: 
0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7257, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8128, loss: 0.8521, batch_reg_loss: 0.2012, reg_loss: 0.2010 ||: 39%|###8 | 37/95 [00:21<00:34, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9377, LAS: 0.8863, UEM: 0.5018, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5346, partial_loss/deprel_loss: 0.6944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8637, loss: 0.8491, batch_reg_loss: 0.2013, reg_loss: 0.2010 ||: 43%|####3 | 41/95 [00:23<00:30, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9386, LAS: 0.8873, UEM: 0.5077, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3799, partial_loss/deprel_loss: 0.5438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.8409, batch_reg_loss: 0.2013, reg_loss: 0.2010 ||: 47%|####7 | 45/95 [00:25<00:27, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8428, UAS: 0.9375, LAS: 0.8861, UEM: 0.5085, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3011, partial_loss/deprel_loss: 0.9288, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2046, loss: 0.8502, batch_reg_loss: 0.2014, reg_loss: 0.2010 ||: 52%|#####1 | 49/95 [00:27<00:24, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9384, LAS: 0.8875, UEM: 0.5119, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8223, loss: 0.8384, batch_reg_loss: 0.2014, reg_loss: 
0.2011 ||: 56%|#####5 | 53/95 [00:30<00:24, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9405, LAS: 0.8896, UEM: 0.5428, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1974, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5803, loss: 0.8211, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||: 60%|###### | 57/95 [00:33<00:22, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9399, LAS: 0.8888, UEM: 0.5363, LEM: 0.2924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.4788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.8269, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||: 64%|######4 | 61/95 [00:36<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9406, LAS: 0.8896, UEM: 0.5465, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3062, partial_loss/deprel_loss: 0.5368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6922, loss: 0.8216, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||: 68%|######8 | 65/95 [00:39<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9390, LAS: 0.8876, UEM: 0.5362, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7500, loss: 0.8364, batch_reg_loss: 0.2016, reg_loss: 0.2012 ||: 73%|#######2 | 69/95 [00:41<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9397, LAS: 0.8884, UEM: 0.5377, LEM: 0.2904, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4453, partial_loss/deprel_loss: 0.5649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.8307, batch_reg_loss: 0.2016, reg_loss: 0.2012 ||: 77%|#######6 | 73/95 [00:44<00:14, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9408, LAS: 0.8897, UEM: 0.5490, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.5402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6907, loss: 0.8207, batch_reg_loss: 0.2017, reg_loss: 0.2012 ||: 81%|########1 | 77/95 [00:46<00:11, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9404, LAS: 0.8891, UEM: 0.5405, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9738, partial_loss/deprel_loss: 0.8144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0480, loss: 0.8244, batch_reg_loss: 0.2017, reg_loss: 0.2012 ||: 85%|########5 | 81/95 [00:49<00:09, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9405, LAS: 0.8894, UEM: 0.5521, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7789, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9885, loss: 0.8224, batch_reg_loss: 0.2018, reg_loss: 0.2013 ||: 89%|########9 | 85/95 [00:51<00:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9407, LAS: 0.8896, UEM: 0.5525, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6416, loss: 0.8202, batch_reg_loss: 0.2018, reg_loss: 0.2013 ||: 94%|#########3| 89/95 [00:54<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9415, LAS: 0.8907, UEM: 0.5746, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6793, partial_loss/deprel_loss: 0.6564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8628, loss: 0.8122, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||: 97%|#########6| 92/95 [00:57<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9420, LAS: 0.8913, UEM: 0.5830, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.5733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8078, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||: 100%|##########| 95/95 [01:00<00:00, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9420, LAS: 0.8913, UEM: 0.5830, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.5733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8078, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||: 100%|##########| 95/95 [01:00<00:00, 1.58it/s]\n", + "2023-04-07 00:32:23,942 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - reg_loss | 0.201 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - 
combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - LEM | 0.343 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EM | 0.903 | N/A\n", + "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.371 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.573 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - loss | 0.808 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - LAS | 0.891 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:32:23,945 - INFO - combo.training.trainer - Epoch duration: 0:01:00.117234\n", + "2023-04-07 00:32:23,945 - INFO - combo.training.trainer - Estimated training time remaining: 5:44:08\n", + "2023-04-07 
00:32:23,945 - INFO - allennlp.training.trainer - Epoch 92/399\n", + "2023-04-07 00:32:23,946 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:32:23,946 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:32:23,954 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9442, LAS: 0.8960, UEM: 0.5319, LEM: 0.2802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4404, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7316, loss: 0.7707, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 4%|4 | 4/95 [00:02<00:59, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9456, LAS: 0.8981, UEM: 0.5816, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1495, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4773, loss: 0.7387, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 8%|8 | 8/95 [00:05<00:56, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9471, LAS: 0.9002, UEM: 0.6313, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5522, partial_loss/deprel_loss: 0.6129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 0.7206, batch_reg_loss: 0.2020, reg_loss: 0.2019 ||: 12%|#1 | 11/95 [00:07<00:55, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9462, LAS: 0.8976, UEM: 0.6210, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6778, loss: 0.7467, batch_reg_loss: 0.2020, reg_loss: 0.2019 ||: 16%|#5 | 15/95 [00:09<00:52, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9444, LAS: 0.8952, UEM: 0.6189, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 0.4781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.7662, batch_reg_loss: 0.2020, reg_loss: 0.2020 ||: 20%|## | 19/95 [00:12<00:49, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9434, LAS: 0.8938, UEM: 0.6076, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6140, loss: 0.7728, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||: 23%|##3 | 22/95 [00:14<00:50, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9412, LAS: 0.8916, UEM: 0.5937, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8600, partial_loss/deprel_loss: 0.7354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9624, loss: 0.7932, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||: 26%|##6 | 25/95 [00:16<00:48, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9422, LAS: 0.8923, UEM: 0.5865, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3595, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.7888, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||: 31%|### | 29/95 [00:21<00:55, 1.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9415, LAS: 0.8919, UEM: 0.5860, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.7944, batch_reg_loss: 0.2022, reg_loss: 0.2020 ||: 34%|###3 | 32/95 [00:23<00:50, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9419, LAS: 0.8920, UEM: 0.5921, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.7953, batch_reg_loss: 0.2022, reg_loss: 0.2020 ||: 37%|###6 | 35/95 [00:25<00:46, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9408, LAS: 0.8909, UEM: 0.5806, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9589, partial_loss/deprel_loss: 0.8305, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0585, loss: 0.8064, batch_reg_loss: 0.2023, reg_loss: 0.2021 ||: 41%|####1 | 39/95 [00:28<00:41, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9423, LAS: 0.8925, UEM: 0.5876, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.5269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6876, loss: 0.7962, batch_reg_loss: 0.2023, reg_loss: 0.2021 ||: 44%|####4 | 42/95 [00:30<00:39, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9438, LAS: 0.8944, UEM: 0.6200, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0571, partial_loss/deprel_loss: 0.1655, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.3461, loss: 0.7831, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||: 47%|####7 | 45/95 [00:33<00:39, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8392, UAS: 0.9418, LAS: 0.8922, UEM: 0.6045, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3574, partial_loss/deprel_loss: 0.9085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2007, loss: 0.8013, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||: 52%|#####1 | 49/95 [00:35<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9072, UAS: 0.9424, LAS: 0.8929, UEM: 0.6013, LEM: 0.3761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3916, partial_loss/deprel_loss: 0.5326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7068, loss: 0.7964, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||: 55%|#####4 | 52/95 [00:37<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9412, LAS: 0.8915, UEM: 0.5947, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4025, partial_loss/deprel_loss: 0.5741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7422, loss: 0.8054, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||: 59%|#####8 | 56/95 [00:40<00:27, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9409, LAS: 0.8910, UEM: 0.5882, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6082, partial_loss/deprel_loss: 0.7029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8864, loss: 0.8087, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||: 62%|######2 | 59/95 [00:42<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9401, LAS: 0.8899, UEM: 0.5841, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2223, partial_loss/deprel_loss: 0.4426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6011, loss: 0.8175, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||: 66%|######6 | 63/95 [00:44<00:21, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9406, LAS: 0.8906, UEM: 0.5872, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.3845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5674, loss: 0.8137, batch_reg_loss: 0.2026, reg_loss: 0.2022 ||: 71%|####### | 67/95 [00:47<00:18, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9401, LAS: 0.8899, UEM: 0.5741, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.5250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7072, loss: 0.8188, batch_reg_loss: 0.2027, reg_loss: 0.2022 ||: 76%|#######5 | 72/95 [00:49<00:13, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9407, LAS: 0.8906, UEM: 0.5698, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7169, loss: 0.8153, batch_reg_loss: 0.2027, reg_loss: 0.2023 ||: 81%|########1 | 77/95 [00:51<00:09, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9411, LAS: 0.8912, UEM: 0.5748, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6897, partial_loss/deprel_loss: 0.6689, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8758, loss: 0.8105, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||: 85%|########5 | 81/95 [00:54<00:08, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9416, LAS: 0.8918, UEM: 0.5759, LEM: 0.3427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2683, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.8069, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||: 89%|########9 | 85/95 [00:57<00:06, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8029, UAS: 0.9412, LAS: 0.8914, UEM: 0.5784, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7882, partial_loss/deprel_loss: 1.1323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4663, loss: 0.8093, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||: 94%|#########3| 89/95 [01:00<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9421, LAS: 0.8924, UEM: 0.5892, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.5763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7429, loss: 0.8016, batch_reg_loss: 0.2029, reg_loss: 0.2024 ||: 98%|#########7| 93/95 [01:03<00:01, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9421, LAS: 0.8923, UEM: 0.5866, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7543, partial_loss/deprel_loss: 0.7355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9422, loss: 0.8027, batch_reg_loss: 0.2029, reg_loss: 0.2024 ||: 100%|##########| 95/95 [01:04<00:00, 
1.46it/s]\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - reg_loss | 0.202 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - UEM | 0.587 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - LEM | 0.349 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EM | 0.880 | N/A\n", + "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.754 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.736 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - loss | 0.803 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - 
LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:28,889 - INFO - combo.training.trainer - Epoch duration: 0:01:04.943569\n", + "2023-04-07 00:33:28,889 - INFO - combo.training.trainer - Estimated training time remaining: 5:42:54\n", + "2023-04-07 00:33:28,889 - INFO - allennlp.training.trainer - Epoch 93/399\n", + "2023-04-07 00:33:28,889 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:33:28,890 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:33:28,897 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9551, LAS: 0.9079, UEM: 0.6613, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6752, batch_reg_loss: 0.2029, reg_loss: 0.2029 ||: 3%|3 | 3/95 [00:02<01:07, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9494, LAS: 0.9022, UEM: 0.5784, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6564, loss: 0.7243, batch_reg_loss: 0.2029, reg_loss: 0.2029 ||: 6%|6 | 6/95 [00:04<01:07, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9448, LAS: 0.8972, UEM: 0.5689, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1788, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5143, loss: 0.7537, batch_reg_loss: 0.2030, reg_loss: 0.2029 ||: 11%|# | 10/95 [00:07<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9417, LAS: 0.8925, UEM: 0.5342, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0468, partial_loss/deprel_loss: 0.8551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0965, loss: 0.7887, batch_reg_loss: 0.2030, reg_loss: 0.2029 ||: 15%|#4 | 14/95 [00:09<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9263, UAS: 0.9447, LAS: 0.8960, UEM: 0.5514, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.3764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5609, loss: 0.7672, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 18%|#7 | 17/95 [00:11<00:54, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9473, LAS: 0.8985, UEM: 0.5909, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1812, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5937, loss: 0.7474, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||: 21%|##1 | 20/95 [00:14<00:53, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9474, LAS: 0.8990, UEM: 0.5733, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6749, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8458, loss: 0.7480, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||: 24%|##4 | 23/95 [00:16<00:53, 1.34it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9447, LAS: 0.8957, UEM: 0.5516, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9470, partial_loss/deprel_loss: 0.8236, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0514, loss: 0.7682, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||: 27%|##7 | 26/95 [00:18<00:50, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9424, LAS: 0.8937, UEM: 0.5940, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9548, partial_loss/deprel_loss: 0.8370, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0637, loss: 0.7856, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||: 31%|### | 29/95 [00:21<00:50, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9420, LAS: 0.8930, UEM: 0.5906, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6104, loss: 0.7914, batch_reg_loss: 0.2032, reg_loss: 0.2030 ||: 35%|###4 | 33/95 [00:24<00:46, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9439, LAS: 0.8952, UEM: 0.6147, LEM: 0.3827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1416, partial_loss/deprel_loss: 0.3271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4932, loss: 0.7750, batch_reg_loss: 0.2032, reg_loss: 0.2030 ||: 38%|###7 | 36/95 [00:26<00:46, 1.27it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9413, LAS: 0.8925, UEM: 0.6020, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9797, partial_loss/deprel_loss: 0.7980, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0376, loss: 0.7976, batch_reg_loss: 0.2032, reg_loss: 0.2031 ||: 42%|####2 | 40/95 [00:29<00:41, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9413, LAS: 0.8926, UEM: 0.6014, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4059, partial_loss/deprel_loss: 0.4809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7987, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||: 45%|####5 | 43/95 [00:31<00:38, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9416, LAS: 0.8929, UEM: 0.5940, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3520, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6282, loss: 0.7982, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||: 48%|####8 | 46/95 [00:33<00:36, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9408, LAS: 0.8923, UEM: 0.5932, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5310, partial_loss/deprel_loss: 0.5824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7755, loss: 0.8032, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||: 52%|#####1 | 49/95 [00:35<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9416, LAS: 0.8931, UEM: 0.5977, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2374, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 0.7971, batch_reg_loss: 0.2034, reg_loss: 0.2031 ||: 55%|#####4 | 52/95 
[00:38<00:32, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9422, LAS: 0.8936, UEM: 0.5977, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5264, loss: 0.7912, batch_reg_loss: 0.2034, reg_loss: 0.2031 ||: 58%|#####7 | 55/95 [00:40<00:30, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9437, LAS: 0.8952, UEM: 0.6204, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2211, partial_loss/deprel_loss: 0.4185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.7779, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||: 61%|######1 | 58/95 [00:42<00:27, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9420, LAS: 0.8931, UEM: 0.6115, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2662, partial_loss/deprel_loss: 0.4593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.7915, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||: 65%|######5 | 62/95 [00:45<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9412, LAS: 0.8922, UEM: 0.6038, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.4549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6443, loss: 0.7980, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||: 68%|######8 | 65/95 [00:47<00:21, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9409, LAS: 0.8918, UEM: 0.5969, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2274, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2397, loss: 0.8019, batch_reg_loss: 0.2036, reg_loss: 0.2032 ||: 73%|#######2 | 69/95 [00:49<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9411, LAS: 0.8920, UEM: 0.5903, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5339, partial_loss/deprel_loss: 0.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7377, loss: 0.7999, batch_reg_loss: 0.2036, reg_loss: 0.2032 ||: 77%|#######6 | 73/95 [00:51<00:13, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9417, LAS: 0.8925, UEM: 0.5943, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7405, partial_loss/deprel_loss: 0.7185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9266, loss: 0.7955, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||: 81%|########1 | 77/95 [00:55<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9421, LAS: 0.8926, UEM: 0.5890, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4679, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.7955, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||: 85%|########5 | 81/95 [00:57<00:09, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9419, LAS: 0.8923, UEM: 0.5810, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.4980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6778, loss: 0.7979, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||: 89%|########9 | 85/95 
[01:00<00:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9415, LAS: 0.8918, UEM: 0.5821, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4739, loss: 0.8018, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||: 94%|#########3| 89/95 [01:03<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9416, LAS: 0.8919, UEM: 0.5845, LEM: 0.3482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.3629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5262, loss: 0.8018, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||: 98%|#########7| 93/95 [01:05<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9416, LAS: 0.8919, UEM: 0.5828, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4139, partial_loss/deprel_loss: 0.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6835, loss: 0.8025, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||: 100%|##########| 95/95 [01:06<00:00, 1.42it/s]\n", + "2023-04-07 00:34:35,742 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:34:35,742 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - reg_loss | 0.203 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UEM | 0.583 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - 
combo.training.tensorboard_writer - LEM | 0.346 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EM | 0.910 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.414 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.496 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.trainer - Epoch duration: 0:01:06.855109\n", + "2023-04-07 00:34:35,744 - INFO - combo.training.trainer - Estimated training time remaining: 5:41:47\n", + "2023-04-07 00:34:35,745 - INFO - allennlp.training.trainer - Epoch 94/399\n", + "2023-04-07 00:34:35,745 - 
INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:34:35,745 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:34:35,753 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9513, LAS: 0.9046, UEM: 0.5646, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6356, loss: 0.7113, batch_reg_loss: 0.2039, reg_loss: 0.2039 ||: 4%|4 | 4/95 [00:02<00:47, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9367, LAS: 0.8890, UEM: 0.4240, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1801, partial_loss/deprel_loss: 0.8011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0808, loss: 0.8297, batch_reg_loss: 0.2040, reg_loss: 0.2039 ||: 9%|9 | 9/95 [00:04<00:43, 1.98it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9369, LAS: 0.8891, UEM: 0.4268, LEM: 0.2037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7108, partial_loss/deprel_loss: 0.7335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9330, loss: 0.8324, batch_reg_loss: 0.2040, reg_loss: 0.2039 ||: 15%|#4 | 14/95 [00:06<00:40, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9375, LAS: 0.8899, UEM: 0.4594, LEM: 0.2311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4623, partial_loss/deprel_loss: 0.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6893, loss: 
0.8311, batch_reg_loss: 0.2041, reg_loss: 0.2040 ||: 20%|## | 19/95 [00:09<00:36, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9387, LAS: 0.8913, UEM: 0.4626, LEM: 0.2315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7904, partial_loss/deprel_loss: 0.7270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9438, loss: 0.8208, batch_reg_loss: 0.2041, reg_loss: 0.2040 ||: 24%|##4 | 23/95 [00:11<00:39, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9386, LAS: 0.8912, UEM: 0.4765, LEM: 0.2432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6284, loss: 0.8215, batch_reg_loss: 0.2042, reg_loss: 0.2040 ||: 28%|##8 | 27/95 [00:15<00:42, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9376, LAS: 0.8897, UEM: 0.4675, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4014, partial_loss/deprel_loss: 0.5172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.8359, batch_reg_loss: 0.2042, reg_loss: 0.2040 ||: 32%|###1 | 30/95 [00:17<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9386, LAS: 0.8901, UEM: 0.4836, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9247, partial_loss/deprel_loss: 0.8234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0479, loss: 0.8314, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||: 35%|###4 | 33/95 [00:19<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9388, LAS: 0.8902, UEM: 
0.4774, LEM: 0.2380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5193, partial_loss/deprel_loss: 0.5783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7708, loss: 0.8284, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||: 38%|###7 | 36/95 [00:21<00:41, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9411, LAS: 0.8928, UEM: 0.5396, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4171, partial_loss/deprel_loss: 0.5062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.8082, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||: 41%|####1 | 39/95 [00:24<00:41, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9422, LAS: 0.8936, UEM: 0.5387, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3443, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6473, loss: 0.7998, batch_reg_loss: 0.2044, reg_loss: 0.2041 ||: 45%|####5 | 43/95 [00:26<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9431, LAS: 0.8946, UEM: 0.5445, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2948, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6303, loss: 0.7902, batch_reg_loss: 0.2044, reg_loss: 0.2041 ||: 48%|####8 | 46/95 [00:28<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9439, LAS: 0.8954, UEM: 0.5561, LEM: 0.3143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.3991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.7827, batch_reg_loss: 0.2044, 
reg_loss: 0.2042 ||: 52%|#####1 | 49/95 [00:31<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9432, LAS: 0.8948, UEM: 0.5649, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8301, partial_loss/deprel_loss: 0.9899, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3624, loss: 0.7852, batch_reg_loss: 0.2044, reg_loss: 0.2042 ||: 55%|#####4 | 52/95 [00:33<00:31, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9416, LAS: 0.8934, UEM: 0.5631, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8940, partial_loss/deprel_loss: 1.1273, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4851, loss: 0.7968, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||: 59%|#####8 | 56/95 [00:36<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9414, LAS: 0.8927, UEM: 0.5574, LEM: 0.3150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4748, partial_loss/deprel_loss: 0.5441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8009, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||: 62%|######2 | 59/95 [00:38<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9412, LAS: 0.8925, UEM: 0.5639, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1639, partial_loss/deprel_loss: 0.3403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.8021, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||: 65%|######5 | 62/95 [00:40<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9414, LAS: 0.8924, UEM: 0.5631, LEM: 0.3221, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6976, partial_loss/deprel_loss: 0.7252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9242, loss: 0.8013, batch_reg_loss: 0.2046, reg_loss: 0.2042 ||: 68%|######8 | 65/95 [00:42<00:21, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9421, LAS: 0.8934, UEM: 0.5750, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2649, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.7934, batch_reg_loss: 0.2046, reg_loss: 0.2043 ||: 72%|#######1 | 68/95 [00:44<00:19, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9427, LAS: 0.8940, UEM: 0.5783, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7786, partial_loss/deprel_loss: 0.6708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8970, loss: 0.7895, batch_reg_loss: 0.2046, reg_loss: 0.2043 ||: 76%|#######5 | 72/95 [00:47<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8442, UAS: 0.9425, LAS: 0.8938, UEM: 0.5854, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0491, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1294, loss: 0.7899, batch_reg_loss: 0.2047, reg_loss: 0.2043 ||: 79%|#######8 | 75/95 [00:49<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9426, LAS: 0.8938, UEM: 0.5852, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.6065, loss: 0.7891, batch_reg_loss: 0.2047, reg_loss: 0.2043 ||: 83%|########3 | 79/95 [00:52<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9423, LAS: 0.8934, UEM: 0.5851, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.6460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8547, loss: 0.7922, batch_reg_loss: 0.2048, reg_loss: 0.2043 ||: 86%|########6 | 82/95 [00:54<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9428, LAS: 0.8939, UEM: 0.5892, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5734, partial_loss/deprel_loss: 0.6591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8468, loss: 0.7884, batch_reg_loss: 0.2048, reg_loss: 0.2043 ||: 89%|########9 | 85/95 [00:56<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9427, LAS: 0.8937, UEM: 0.5876, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4860, loss: 0.7909, batch_reg_loss: 0.2048, reg_loss: 0.2044 ||: 94%|#########3| 89/95 [00:59<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9421, LAS: 0.8930, UEM: 0.5862, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1924, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5408, loss: 0.7960, batch_reg_loss: 0.2049, reg_loss: 0.2044 ||: 98%|#########7| 93/95 [01:01<00:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9426, LAS: 0.8934, UEM: 0.5887, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2714, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6364, loss: 0.7931, batch_reg_loss: 0.2049, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - reg_loss | 0.204 | N/A\n", + "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - LEM | 0.348 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - EM | 0.915 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.271 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.471 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - loss | 0.793 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 
00:35:38,888 - INFO - combo.training.tensorboard_writer - LAS | 0.893 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:35:38,889 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:35:38,889 - INFO - combo.training.trainer - Epoch duration: 0:01:03.144660\n", + "2023-04-07 00:35:38,889 - INFO - combo.training.trainer - Estimated training time remaining: 5:40:27\n", + "2023-04-07 00:35:38,889 - INFO - allennlp.training.trainer - Epoch 95/399\n", + "2023-04-07 00:35:38,890 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:35:38,890 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:35:38,897 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9242, LAS: 0.8762, UEM: 0.2850, LEM: 0.0992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8615, partial_loss/deprel_loss: 0.7358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9659, loss: 0.9411, batch_reg_loss: 0.2049, reg_loss: 0.2049 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9353, LAS: 0.8858, UEM: 0.3636, LEM: 0.1408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4285, partial_loss/deprel_loss: 0.5383, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.8561, batch_reg_loss: 0.2050, reg_loss: 0.2049 ||: 8%|8 | 8/95 [00:05<00:56, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9352, LAS: 0.8868, UEM: 0.3439, LEM: 0.1287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6405, partial_loss/deprel_loss: 0.6543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.8527, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 13%|#2 | 12/95 [00:07<00:53, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9419, LAS: 0.8933, UEM: 0.4871, LEM: 0.2392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4230, partial_loss/deprel_loss: 0.5419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7232, loss: 0.7997, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||: 16%|#5 | 15/95 [00:10<00:54, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9448, LAS: 0.8961, UEM: 0.5225, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.7767, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||: 20%|## | 19/95 [00:12<00:50, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9486, LAS: 0.9009, UEM: 0.6363, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2845, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6115, loss: 0.7372, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||: 23%|##3 | 22/95 [00:15<00:55, 1.32it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9464, LAS: 0.8982, UEM: 0.6087, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 0.7642, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0090, loss: 0.7555, batch_reg_loss: 0.2052, reg_loss: 0.2050 ||: 27%|##7 | 26/95 [00:17<00:49, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9468, LAS: 0.8986, UEM: 0.6059, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2224, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5754, loss: 0.7529, batch_reg_loss: 0.2052, reg_loss: 0.2050 ||: 31%|### | 29/95 [00:20<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9478, LAS: 0.8997, UEM: 0.6138, LEM: 0.3754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2597, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.7434, batch_reg_loss: 0.2052, reg_loss: 0.2051 ||: 34%|###3 | 32/95 [00:22<00:44, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9495, LAS: 0.9011, UEM: 0.6279, LEM: 0.3809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3057, partial_loss/deprel_loss: 0.5072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7326, batch_reg_loss: 0.2052, reg_loss: 0.2051 ||: 37%|###6 | 35/95 [00:24<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9477, LAS: 0.8993, UEM: 0.6249, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0380, 
partial_loss/deprel_loss: 1.1467, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5302, loss: 0.7497, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||: 41%|####1 | 39/95 [00:26<00:36, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9494, LAS: 0.9009, UEM: 0.6406, LEM: 0.3918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3377, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6790, loss: 0.7387, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||: 46%|####6 | 44/95 [00:28<00:30, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8523, UAS: 0.9472, LAS: 0.8982, UEM: 0.6176, LEM: 0.3726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9144, partial_loss/deprel_loss: 0.7901, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0203, loss: 0.7603, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||: 52%|#####1 | 49/95 [00:30<00:25, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9459, LAS: 0.8968, UEM: 0.6143, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.7709, batch_reg_loss: 0.2054, reg_loss: 0.2052 ||: 57%|#####6 | 54/95 [00:33<00:22, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9452, LAS: 0.8961, UEM: 0.6056, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6259, loss: 0.7803, batch_reg_loss: 0.2054, reg_loss: 0.2052 ||: 61%|######1 | 58/95 [00:36<00:22, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8185, UAS: 0.9436, LAS: 0.8946, UEM: 0.5940, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5388, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2945, loss: 0.7898, batch_reg_loss: 0.2055, reg_loss: 0.2052 ||: 65%|######5 | 62/95 [00:39<00:21, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9433, LAS: 0.8943, UEM: 0.6019, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.7921, batch_reg_loss: 0.2055, reg_loss: 0.2052 ||: 69%|######9 | 66/95 [00:42<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9427, LAS: 0.8936, UEM: 0.5969, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3676, partial_loss/deprel_loss: 0.5613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7281, loss: 0.7958, batch_reg_loss: 0.2056, reg_loss: 0.2052 ||: 74%|#######3 | 70/95 [00:45<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9431, LAS: 0.8940, UEM: 0.5940, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2323, partial_loss/deprel_loss: 0.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.7930, batch_reg_loss: 0.2056, reg_loss: 0.2052 ||: 78%|#######7 | 74/95 [00:47<00:13, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8280, UAS: 0.9425, LAS: 0.8933, UEM: 0.5922, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3858, 
partial_loss/deprel_loss: 1.0559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3275, loss: 0.7993, batch_reg_loss: 0.2057, reg_loss: 0.2053 ||: 82%|########2 | 78/95 [00:50<00:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9417, LAS: 0.8922, UEM: 0.5842, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0717, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1375, loss: 0.8070, batch_reg_loss: 0.2057, reg_loss: 0.2053 ||: 86%|########6 | 82/95 [00:52<00:08, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9414, LAS: 0.8918, UEM: 0.5776, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8504, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0116, loss: 0.8100, batch_reg_loss: 0.2058, reg_loss: 0.2053 ||: 91%|######### | 86/95 [00:55<00:05, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9421, LAS: 0.8925, UEM: 0.5823, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.3931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.8046, batch_reg_loss: 0.2058, reg_loss: 0.2053 ||: 95%|#########4| 90/95 [00:58<00:03, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9418, LAS: 0.8923, UEM: 0.5858, LEM: 0.3442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3271, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.8063, batch_reg_loss: 0.2059, reg_loss: 0.2054 ||: 
99%|#########8| 94/95 [01:01<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9420, LAS: 0.8924, UEM: 0.5895, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3248, partial_loss/deprel_loss: 0.4186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6058, loss: 0.8041, batch_reg_loss: 0.2059, reg_loss: 0.2054 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 00:36:41,183 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9553, LAS: 0.9034, UEM: 0.7548, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1291, partial_loss/deprel_loss: 40.7917, partial_loss/cycle_loss: 0.0000, batch_loss: 32.8592, loss: 22.6777, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:10, 1.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9617, LAS: 0.9134, UEM: 0.7913, LEM: 0.5315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 8.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0401, loss: 16.5296, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.10s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.9586, LAS: 0.9074, UEM: 0.7498, LEM: 0.4686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0857, partial_loss/deprel_loss: 36.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 29.7964, loss: 18.5827, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:08<00:03, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9500, LAS: 0.8971, UEM: 0.6831, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5525, partial_loss/deprel_loss: 46.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 37.7703, loss: 20.8966, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9500, LAS: 0.8971, UEM: 0.6831, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5525, partial_loss/deprel_loss: 46.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 37.7703, loss: 20.8966, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00, 1.02s/it]\n", + "2023-04-07 00:36:52,373 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:36:52,373 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - reg_loss | 0.205 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | 0.683\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - LEM | 0.348 | 0.411\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EM | 0.909 | 0.849\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.325 | 1.552\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - 
combo.training.tensorboard_writer - UAS | 0.942 | 0.950\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.419 | 46.825\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - loss | 0.804 | 20.897\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | 0.897\n", + "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:36:52,375 - INFO - combo.training.trainer - Epoch duration: 0:01:13.485998\n", + "2023-04-07 00:36:52,376 - INFO - combo.training.trainer - Estimated training time remaining: 5:39:41\n", + "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - Epoch 96/399\n", + "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:36:52,383 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9413, LAS: 0.8866, UEM: 0.4235, LEM: 0.1511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 0.7699, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0051, loss: 0.8340, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||: 4%|4 | 4/95 [00:02<00:57, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9493, LAS: 0.8960, UEM: 0.4964, LEM: 0.1846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.4901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6643, loss: 0.7739, batch_reg_loss: 0.2060, reg_loss: 0.2059 ||: 8%|8 | 8/95 [00:05<00:54, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9466, LAS: 0.8944, UEM: 0.5602, LEM: 0.2649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.7727, batch_reg_loss: 0.2060, reg_loss: 0.2060 ||: 12%|#1 | 11/95 [00:07<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9500, LAS: 0.8998, UEM: 0.6595, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0433, partial_loss/deprel_loss: 0.1511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3356, loss: 0.7380, batch_reg_loss: 0.2060, reg_loss: 0.2060 ||: 15%|#4 | 14/95 [00:10<00:59, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9471, LAS: 0.8967, UEM: 0.6291, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 0.7544, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||: 
19%|#8 | 18/95 [00:12<00:52, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9463, LAS: 0.8958, UEM: 0.6229, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2154, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.7659, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||: 23%|##3 | 22/95 [00:14<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9458, LAS: 0.8956, UEM: 0.6195, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7033, loss: 0.7639, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||: 26%|##6 | 25/95 [00:17<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9459, LAS: 0.8957, UEM: 0.6239, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5298, loss: 0.7614, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||: 29%|##9 | 28/95 [00:19<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9443, LAS: 0.8943, UEM: 0.6144, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.7762, batch_reg_loss: 0.2062, reg_loss: 0.2060 ||: 34%|###3 | 32/95 [00:22<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9448, LAS: 0.8948, UEM: 0.6088, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7992, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9952, loss: 0.7765, batch_reg_loss: 0.2062, reg_loss: 0.2061 ||: 38%|###7 | 36/95 [00:24<00:39, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9458, LAS: 0.8959, UEM: 0.6143, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2885, partial_loss/deprel_loss: 0.4762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.7664, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||: 41%|####1 | 39/95 [00:27<00:42, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9465, LAS: 0.8968, UEM: 0.6353, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1215, partial_loss/deprel_loss: 0.2574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.7600, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||: 44%|####4 | 42/95 [00:29<00:39, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9437, LAS: 0.8938, UEM: 0.6203, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2840, partial_loss/deprel_loss: 0.8396, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1348, loss: 0.7827, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||: 48%|####8 | 46/95 [00:32<00:35, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9449, LAS: 0.8952, UEM: 0.6273, LEM: 0.3820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6025, loss: 0.7730, batch_reg_loss: 0.2064, reg_loss: 0.2061 ||: 52%|#####1 | 49/95 [00:34<00:34, 
1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9463, LAS: 0.8967, UEM: 0.6405, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.5259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7182, loss: 0.7622, batch_reg_loss: 0.2064, reg_loss: 0.2061 ||: 56%|#####5 | 53/95 [00:36<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9452, LAS: 0.8955, UEM: 0.6223, LEM: 0.3794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7172, loss: 0.7743, batch_reg_loss: 0.2064, reg_loss: 0.2062 ||: 61%|######1 | 58/95 [00:39<00:22, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9459, LAS: 0.8959, UEM: 0.6254, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2003, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.7719, batch_reg_loss: 0.2065, reg_loss: 0.2062 ||: 65%|######5 | 62/95 [00:41<00:19, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9453, LAS: 0.8955, UEM: 0.6218, LEM: 0.3792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1490, partial_loss/deprel_loss: 0.3464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5134, loss: 0.7788, batch_reg_loss: 0.2065, reg_loss: 0.2062 ||: 69%|######9 | 66/95 [00:43<00:16, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9442, LAS: 0.8941, UEM: 0.6146, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3394, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6833, loss: 0.7902, batch_reg_loss: 0.2066, reg_loss: 0.2062 ||: 74%|#######3 | 70/95 [00:45<00:13, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9428, LAS: 0.8925, UEM: 0.6090, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2194, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5969, loss: 0.8012, batch_reg_loss: 0.2066, reg_loss: 0.2062 ||: 78%|#######7 | 74/95 [00:48<00:12, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9431, LAS: 0.8928, UEM: 0.6043, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7139, partial_loss/deprel_loss: 0.7457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9460, loss: 0.7995, batch_reg_loss: 0.2067, reg_loss: 0.2063 ||: 82%|########2 | 78/95 [00:51<00:11, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9426, LAS: 0.8923, UEM: 0.6025, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3274, partial_loss/deprel_loss: 0.4576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6383, loss: 0.8013, batch_reg_loss: 0.2067, reg_loss: 0.2063 ||: 86%|########6 | 82/95 [00:53<00:08, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9425, LAS: 0.8922, UEM: 0.5929, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6534, partial_loss/deprel_loss: 0.8070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9830, loss: 0.8033, batch_reg_loss: 0.2068, reg_loss: 0.2063 ||: 91%|######### | 86/95 [00:56<00:06, 
1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9428, LAS: 0.8924, UEM: 0.5966, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4715, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7570, loss: 0.8010, batch_reg_loss: 0.2068, reg_loss: 0.2063 ||: 95%|#########4| 90/95 [00:59<00:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9426, LAS: 0.8921, UEM: 0.5884, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9063, partial_loss/deprel_loss: 0.7899, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0201, loss: 0.8040, batch_reg_loss: 0.2069, reg_loss: 0.2064 ||: 99%|#########8| 94/95 [01:02<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9429, LAS: 0.8924, UEM: 0.5906, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6251, loss: 0.8021, batch_reg_loss: 0.2069, reg_loss: 0.2064 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - reg_loss | 0.206 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UEM | 0.591 | 
N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - LEM | 0.345 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EM | 0.920 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.255 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.459 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - loss | 0.802 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:55,221 - INFO - combo.training.trainer - Epoch duration: 0:01:02.845131\n", + "2023-04-07 00:37:55,221 - INFO - combo.training.trainer - Estimated training time remaining: 5:38:21\n", + "2023-04-07 00:37:55,221 - INFO - allennlp.training.trainer - 
Epoch 97/399\n", + "2023-04-07 00:37:55,221 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:37:55,222 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:37:55,228 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9419, LAS: 0.8920, UEM: 0.3952, LEM: 0.1597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6851, partial_loss/deprel_loss: 0.6447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8597, loss: 0.8136, batch_reg_loss: 0.2069, reg_loss: 0.2069 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9512, LAS: 0.9010, UEM: 0.5581, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2635, partial_loss/deprel_loss: 0.4261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.7490, batch_reg_loss: 0.2070, reg_loss: 0.2069 ||: 8%|8 | 8/95 [00:05<00:57, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9556, LAS: 0.9075, UEM: 0.6934, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1694, partial_loss/deprel_loss: 0.3743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5404, loss: 0.7027, batch_reg_loss: 0.2070, reg_loss: 0.2070 ||: 12%|#1 | 11/95 [00:07<00:59, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9558, LAS: 0.9078, UEM: 0.6931, LEM: 0.4594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1622, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.6936, batch_reg_loss: 
0.2070, reg_loss: 0.2070 ||: 15%|#4 | 14/95 [00:09<00:57, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9506, LAS: 0.9026, UEM: 0.6768, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4128, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7064, loss: 0.7229, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||: 19%|#8 | 18/95 [00:12<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9455, LAS: 0.8965, UEM: 0.6393, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4682, partial_loss/deprel_loss: 0.5416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7340, loss: 0.7679, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||: 23%|##3 | 22/95 [00:14<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9432, LAS: 0.8937, UEM: 0.6066, LEM: 0.3802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7097, partial_loss/deprel_loss: 0.6215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8462, loss: 0.7868, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||: 27%|##7 | 26/95 [00:17<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9442, LAS: 0.8947, UEM: 0.6040, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.5566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.7828, batch_reg_loss: 0.2072, reg_loss: 0.2070 ||: 31%|### | 29/95 [00:19<00:46, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9453, LAS: 0.8959, UEM: 0.6047, LEM: 0.3694, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.7728, batch_reg_loss: 0.2072, reg_loss: 0.2071 ||: 34%|###3 | 32/95 [00:21<00:43, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9460, LAS: 0.8969, UEM: 0.6114, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1764, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.7677, batch_reg_loss: 0.2072, reg_loss: 0.2071 ||: 37%|###6 | 35/95 [00:24<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9461, LAS: 0.8968, UEM: 0.6037, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6509, partial_loss/deprel_loss: 0.7461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9344, loss: 0.7692, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||: 40%|#### | 38/95 [00:26<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9477, LAS: 0.8984, UEM: 0.6260, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3298, partial_loss/deprel_loss: 0.3937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5882, loss: 0.7543, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||: 43%|####3 | 41/95 [00:28<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9481, LAS: 0.8990, UEM: 0.6309, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1242, partial_loss/deprel_loss: 0.2849, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.4601, loss: 0.7516, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||: 47%|####7 | 45/95 [00:31<00:35, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9477, LAS: 0.8984, UEM: 0.6278, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.7560, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||: 51%|##### | 48/95 [00:33<00:34, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9461, LAS: 0.8966, UEM: 0.6145, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 0.7306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.7712, batch_reg_loss: 0.2074, reg_loss: 0.2071 ||: 54%|#####3 | 51/95 [00:35<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9462, LAS: 0.8964, UEM: 0.6060, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5400, partial_loss/deprel_loss: 0.5703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7716, loss: 0.7712, batch_reg_loss: 0.2074, reg_loss: 0.2072 ||: 58%|#####7 | 55/95 [00:38<00:27, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9458, LAS: 0.8962, UEM: 0.6014, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5700, partial_loss/deprel_loss: 0.6182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8160, loss: 0.7742, batch_reg_loss: 0.2074, reg_loss: 0.2072 ||: 61%|######1 | 58/95 [00:40<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 
0.9459, LAS: 0.8965, UEM: 0.6113, LEM: 0.3727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0668, partial_loss/deprel_loss: 0.8189, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0759, loss: 0.7712, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||: 64%|######4 | 61/95 [00:42<00:24, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9458, LAS: 0.8966, UEM: 0.6046, LEM: 0.3656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8410, partial_loss/deprel_loss: 0.8078, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0220, loss: 0.7762, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||: 68%|######8 | 65/95 [00:45<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9458, LAS: 0.8967, UEM: 0.6065, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8679, partial_loss/deprel_loss: 0.8099, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0290, loss: 0.7760, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||: 72%|#######1 | 68/95 [00:47<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9443, LAS: 0.8950, UEM: 0.5978, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9440, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0175, loss: 0.7895, batch_reg_loss: 0.2076, reg_loss: 0.2072 ||: 75%|#######4 | 71/95 [00:49<00:16, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9446, LAS: 0.8952, UEM: 0.5970, LEM: 0.3585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6154, 
loss: 0.7879, batch_reg_loss: 0.2076, reg_loss: 0.2073 ||: 78%|#######7 | 74/95 [00:51<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9448, LAS: 0.8955, UEM: 0.6005, LEM: 0.3605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2562, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5862, loss: 0.7862, batch_reg_loss: 0.2076, reg_loss: 0.2073 ||: 81%|########1 | 77/95 [00:53<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9451, LAS: 0.8959, UEM: 0.6014, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2525, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5987, loss: 0.7830, batch_reg_loss: 0.2077, reg_loss: 0.2073 ||: 84%|########4 | 80/95 [00:55<00:10, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8159, UAS: 0.9433, LAS: 0.8938, UEM: 0.5915, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6011, partial_loss/deprel_loss: 0.9215, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2651, loss: 0.7986, batch_reg_loss: 0.2077, reg_loss: 0.2073 ||: 88%|########8 | 84/95 [00:58<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8293, UAS: 0.9430, LAS: 0.8936, UEM: 0.5878, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4834, partial_loss/deprel_loss: 1.0250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3245, loss: 0.8012, batch_reg_loss: 0.2078, reg_loss: 0.2073 ||: 93%|#########2| 88/95 [01:00<00:04, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, 
UAS: 0.9427, LAS: 0.8933, UEM: 0.5894, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9498, partial_loss/deprel_loss: 1.1388, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5088, loss: 0.8028, batch_reg_loss: 0.2078, reg_loss: 0.2073 ||: 98%|#########7| 93/95 [01:03<00:01, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9428, LAS: 0.8935, UEM: 0.5891, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7368, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8841, loss: 0.8013, batch_reg_loss: 0.2079, reg_loss: 0.2074 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-07 00:38:59,486 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - reg_loss | 0.207 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - LEM | 0.349 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EM | 0.883 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.737 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:38:59,487 - 
INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.661 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - LAS | 0.894 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:38:59,489 - INFO - combo.training.trainer - Epoch duration: 0:01:04.267507\n", + "2023-04-07 00:38:59,489 - INFO - combo.training.trainer - Estimated training time remaining: 5:37:05\n", + "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - Epoch 98/399\n", + "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:38:59,496 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9357, LAS: 0.8838, UEM: 0.4643, LEM: 0.2083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4956, 
partial_loss/deprel_loss: 0.9264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2482, loss: 0.8428, batch_reg_loss: 0.2079, reg_loss: 0.2079 ||: 4%|4 | 4/95 [00:02<00:51, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9330, LAS: 0.8817, UEM: 0.3829, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6764, partial_loss/deprel_loss: 0.6329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8496, loss: 0.8622, batch_reg_loss: 0.2079, reg_loss: 0.2079 ||: 7%|7 | 7/95 [00:04<00:52, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9421, LAS: 0.8942, UEM: 0.6039, LEM: 0.4192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0606, partial_loss/deprel_loss: 0.1576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3462, loss: 0.7862, batch_reg_loss: 0.2080, reg_loss: 0.2079 ||: 12%|#1 | 11/95 [00:06<00:51, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9335, LAS: 0.8849, UEM: 0.5404, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6843, partial_loss/deprel_loss: 0.6419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8585, loss: 0.8607, batch_reg_loss: 0.2080, reg_loss: 0.2080 ||: 16%|#5 | 15/95 [00:09<00:49, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9392, LAS: 0.8904, UEM: 0.5790, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6972, loss: 0.8190, batch_reg_loss: 0.2081, reg_loss: 0.2080 ||: 20%|## | 19/95 [00:11<00:46, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9406, LAS: 0.8923, UEM: 0.5903, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4466, partial_loss/deprel_loss: 0.6045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7811, loss: 0.8112, batch_reg_loss: 0.2082, reg_loss: 0.2080 ||: 25%|##5 | 24/95 [00:14<00:40, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9406, LAS: 0.8917, UEM: 0.5703, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6673, loss: 0.8141, batch_reg_loss: 0.2082, reg_loss: 0.2080 ||: 29%|##9 | 28/95 [00:16<00:37, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9413, LAS: 0.8924, UEM: 0.5910, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2402, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5824, loss: 0.8062, batch_reg_loss: 0.2082, reg_loss: 0.2081 ||: 34%|###3 | 32/95 [00:19<00:37, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9426, LAS: 0.8939, UEM: 0.6176, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5229, partial_loss/deprel_loss: 0.6118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8023, loss: 0.7957, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||: 38%|###7 | 36/95 [00:22<00:37, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9405, LAS: 0.8914, UEM: 0.5972, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2203, partial_loss/deprel_loss: 0.8665, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.1456, loss: 0.8147, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||: 42%|####2 | 40/95 [00:25<00:36, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9418, LAS: 0.8925, UEM: 0.5959, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7652, loss: 0.8076, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||: 45%|####5 | 43/95 [00:27<00:37, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9430, LAS: 0.8936, UEM: 0.6003, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.4677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6345, loss: 0.7996, batch_reg_loss: 0.2084, reg_loss: 0.2081 ||: 48%|####8 | 46/95 [00:29<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9437, LAS: 0.8944, UEM: 0.6065, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6041, partial_loss/deprel_loss: 0.5779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7916, loss: 0.7918, batch_reg_loss: 0.2084, reg_loss: 0.2081 ||: 52%|#####1 | 49/95 [00:31<00:33, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9444, LAS: 0.8952, UEM: 0.6066, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.4441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7877, batch_reg_loss: 0.2084, reg_loss: 0.2082 ||: 56%|#####5 | 53/95 [00:34<00:30, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9438, LAS: 0.8943, UEM: 0.5992, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7016, loss: 0.7940, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||: 59%|#####8 | 56/95 [00:37<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9423, LAS: 0.8927, UEM: 0.5927, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2788, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6268, loss: 0.8044, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||: 63%|######3 | 60/95 [00:39<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9423, LAS: 0.8927, UEM: 0.5862, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7276, partial_loss/deprel_loss: 0.7248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9339, loss: 0.8041, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||: 67%|######7 | 64/95 [00:41<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9426, LAS: 0.8929, UEM: 0.5919, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.8006, batch_reg_loss: 0.2086, reg_loss: 0.2082 ||: 72%|#######1 | 68/95 [00:45<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9438, LAS: 0.8942, UEM: 0.6073, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1129, partial_loss/deprel_loss: 0.3218, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.7909, batch_reg_loss: 0.2086, reg_loss: 0.2083 ||: 75%|#######4 | 71/95 [00:47<00:17, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9430, LAS: 0.8932, UEM: 0.5973, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5020, partial_loss/deprel_loss: 0.6178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8033, loss: 0.7991, batch_reg_loss: 0.2086, reg_loss: 0.2083 ||: 79%|#######8 | 75/95 [00:49<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9435, LAS: 0.8939, UEM: 0.5990, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4111, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.7938, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||: 82%|########2 | 78/95 [00:52<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9432, LAS: 0.8937, UEM: 0.5940, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8354, partial_loss/deprel_loss: 0.7642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9871, loss: 0.7941, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||: 85%|########5 | 81/95 [00:54<00:10, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8602, UAS: 0.9433, LAS: 0.8938, UEM: 0.5930, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9581, partial_loss/deprel_loss: 0.8794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1039, loss: 0.7942, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||: 88%|########8 | 84/95 [00:56<00:08, 
1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9430, LAS: 0.8934, UEM: 0.5933, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.7963, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||: 92%|#########1| 87/95 [00:58<00:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9431, LAS: 0.8936, UEM: 0.5931, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.7952, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||: 96%|#########5| 91/95 [01:01<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9427, LAS: 0.8931, UEM: 0.5890, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.7966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0165, loss: 0.7985, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:04<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9427, LAS: 0.8931, UEM: 0.5890, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.7966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0165, loss: 0.7985, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + 
"2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - reg_loss | 0.208 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - LEM | 0.345 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EM | 0.862 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.852 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.797 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - loss | 0.799 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - LAS | 0.893 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
N/A\n", + "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:03,538 - INFO - combo.training.trainer - Epoch duration: 0:01:04.049029\n", + "2023-04-07 00:40:03,538 - INFO - combo.training.trainer - Estimated training time remaining: 5:35:49\n", + "2023-04-07 00:40:03,538 - INFO - allennlp.training.trainer - Epoch 99/399\n", + "2023-04-07 00:40:03,538 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:40:03,539 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:40:03,546 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.9333, LAS: 0.8825, UEM: 0.5525, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5290, partial_loss/deprel_loss: 0.9262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2556, loss: 0.8527, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9410, LAS: 0.8895, UEM: 0.6034, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8687, partial_loss/deprel_loss: 0.8306, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0471, loss: 0.8119, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||: 7%|7 | 7/95 [00:04<01:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9387, LAS: 0.8878, UEM: 0.5300, LEM: 0.2876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5496, partial_loss/deprel_loss: 0.5826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7849, loss: 0.8348, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||: 11%|# | 10/95 [00:07<00:59, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9403, LAS: 0.8906, UEM: 0.5537, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8904, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9274, loss: 0.8144, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||: 15%|#4 | 14/95 [00:09<00:55, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9414, LAS: 0.8922, UEM: 0.5599, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0540, partial_loss/deprel_loss: 0.8520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1014, loss: 0.8022, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||: 19%|#8 | 18/95 [00:12<00:51, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9432, LAS: 0.8941, UEM: 0.5652, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3522, partial_loss/deprel_loss: 0.4730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6578, loss: 0.7904, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||: 22%|##2 | 21/95 [00:14<00:51, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9442, LAS: 0.8951, UEM: 0.5852, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2949, partial_loss/deprel_loss: 0.4758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6487, loss: 0.7812, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||: 25%|##5 | 24/95 [00:16<00:49, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9427, LAS: 0.8933, UEM: 0.5612, LEM: 0.3138, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5461, partial_loss/deprel_loss: 0.6731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8568, loss: 0.7966, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||: 28%|##8 | 27/95 [00:18<00:47, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9407, LAS: 0.8915, UEM: 0.5802, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1346, partial_loss/deprel_loss: 0.8412, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1090, loss: 0.8129, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||: 32%|###1 | 30/95 [00:20<00:46, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9411, LAS: 0.8917, UEM: 0.5738, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8135, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9402, loss: 0.8104, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||: 35%|###4 | 33/95 [00:23<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9415, LAS: 0.8922, UEM: 0.5693, LEM: 0.3282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7584, partial_loss/deprel_loss: 0.7292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.8085, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||: 38%|###7 | 36/95 [00:25<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9415, LAS: 0.8923, UEM: 0.5604, LEM: 0.3206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3089, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.8075, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||: 
41%|####1 | 39/95 [00:27<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9395, LAS: 0.8899, UEM: 0.5407, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7474, partial_loss/deprel_loss: 0.6663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8918, loss: 0.8278, batch_reg_loss: 0.2093, reg_loss: 0.2091 ||: 45%|####5 | 43/95 [00:29<00:35, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9398, LAS: 0.8902, UEM: 0.5434, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5106, partial_loss/deprel_loss: 0.6244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8110, loss: 0.8263, batch_reg_loss: 0.2093, reg_loss: 0.2091 ||: 49%|####9 | 47/95 [00:31<00:30, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9403, LAS: 0.8907, UEM: 0.5577, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4097, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7479, loss: 0.8212, batch_reg_loss: 0.2094, reg_loss: 0.2091 ||: 54%|#####3 | 51/95 [00:33<00:26, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9402, LAS: 0.8905, UEM: 0.5506, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9492, partial_loss/deprel_loss: 0.7954, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0356, loss: 0.8245, batch_reg_loss: 0.2094, reg_loss: 0.2091 ||: 58%|#####7 | 55/95 [00:35<00:22, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9418, LAS: 0.8922, UEM: 0.5665, LEM: 0.3246, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.4485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.8104, batch_reg_loss: 0.2095, reg_loss: 0.2092 ||: 63%|######3 | 60/95 [00:38<00:18, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7850, UAS: 0.9407, LAS: 0.8909, UEM: 0.5628, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0868, partial_loss/deprel_loss: 1.1629, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5572, loss: 0.8184, batch_reg_loss: 0.2095, reg_loss: 0.2092 ||: 67%|######7 | 64/95 [00:41<00:18, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9420, LAS: 0.8927, UEM: 0.5980, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7665, loss: 0.8049, batch_reg_loss: 0.2096, reg_loss: 0.2092 ||: 72%|#######1 | 68/95 [00:44<00:17, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9424, LAS: 0.8931, UEM: 0.5918, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5943, partial_loss/deprel_loss: 0.6195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8240, loss: 0.8010, batch_reg_loss: 0.2096, reg_loss: 0.2092 ||: 76%|#######5 | 72/95 [00:47<00:15, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9425, LAS: 0.8932, UEM: 0.5915, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5636, loss: 0.8016, batch_reg_loss: 0.2097, reg_loss: 0.2092 ||: 
80%|######## | 76/95 [00:49<00:12, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9430, LAS: 0.8936, UEM: 0.5961, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3083, partial_loss/deprel_loss: 0.4880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7945, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||: 84%|########4 | 80/95 [00:52<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9434, LAS: 0.8940, UEM: 0.5974, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4523, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7340, loss: 0.7911, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||: 88%|########8 | 84/95 [00:55<00:07, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8644, UAS: 0.9434, LAS: 0.8940, UEM: 0.5952, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.7898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0372, loss: 0.7914, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||: 92%|#########1| 87/95 [00:57<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9431, LAS: 0.8936, UEM: 0.5911, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.5760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7902, loss: 0.7939, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||: 95%|#########4| 90/95 [00:59<00:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9163, UAS: 0.9432, LAS: 0.8937, UEM: 0.5890, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3280, partial_loss/deprel_loss: 0.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6056, loss: 0.7929, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||: 98%|#########7| 93/95 [01:01<00:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8516, UAS: 0.9429, LAS: 0.8933, UEM: 0.5858, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2694, partial_loss/deprel_loss: 0.8741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1630, loss: 0.7965, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - reg_loss | 0.209 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UEM | 0.586 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - LEM | 0.345 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EM | 0.852 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.269 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 
00:41:06,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.874 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - loss | 0.796 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - LAS | 0.893 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:41:06,739 - INFO - combo.training.trainer - Epoch duration: 0:01:03.200859\n", + "2023-04-07 00:41:06,739 - INFO - combo.training.trainer - Estimated training time remaining: 5:34:31\n", + "2023-04-07 00:41:06,739 - INFO - allennlp.training.trainer - Epoch 100/399\n", + "2023-04-07 00:41:06,739 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:41:06,740 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:41:06,760 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.8957, LAS: 0.8423, UEM: 0.0505, LEM: 0.0051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0992, partial_loss/deprel_loss: 0.8315, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.0949, loss: 1.1352, batch_reg_loss: 0.2098, reg_loss: 0.2098 ||: 3%|3 | 3/95 [00:02<01:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9169, LAS: 0.8659, UEM: 0.5052, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3273, partial_loss/deprel_loss: 0.7813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1003, loss: 0.9686, batch_reg_loss: 0.2099, reg_loss: 0.2098 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9282, LAS: 0.8775, UEM: 0.5276, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7433, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9497, loss: 0.8948, batch_reg_loss: 0.2099, reg_loss: 0.2099 ||: 11%|# | 10/95 [00:06<00:57, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9314, LAS: 0.8817, UEM: 0.5023, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5311, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7436, loss: 0.8731, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||: 15%|#4 | 14/95 [00:09<00:52, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9361, LAS: 0.8869, UEM: 0.5188, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4068, partial_loss/deprel_loss: 0.4875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.8388, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||: 18%|#7 | 17/95 [00:11<00:51, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9375, 
LAS: 0.8890, UEM: 0.5690, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1092, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0216, loss: 0.8185, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||: 21%|##1 | 20/95 [00:13<00:51, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9375, LAS: 0.8888, UEM: 0.5810, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1757, partial_loss/deprel_loss: 0.3448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.8215, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||: 25%|##5 | 24/95 [00:15<00:48, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9397, LAS: 0.8913, UEM: 0.6007, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2510, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.8017, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||: 28%|##8 | 27/95 [00:18<00:49, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9424, LAS: 0.8944, UEM: 0.6485, LEM: 0.4256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0601, partial_loss/deprel_loss: 0.1583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.7807, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||: 32%|###1 | 30/95 [00:21<00:51, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9431, LAS: 0.8954, UEM: 0.6496, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2603, partial_loss/deprel_loss: 0.4238, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.7749, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||: 35%|###4 | 33/95 [00:23<00:47, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9422, LAS: 0.8947, UEM: 0.6246, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7372, loss: 0.7804, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||: 39%|###8 | 37/95 [00:25<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9418, LAS: 0.8939, UEM: 0.6084, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.7889, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||: 43%|####3 | 41/95 [00:28<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9417, LAS: 0.8937, UEM: 0.6145, LEM: 0.3926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1120, partial_loss/deprel_loss: 0.3045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.7902, batch_reg_loss: 0.2102, reg_loss: 0.2101 ||: 47%|####7 | 45/95 [00:31<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9424, LAS: 0.8945, UEM: 0.6130, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5984, partial_loss/deprel_loss: 0.6446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8456, loss: 0.7852, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||: 51%|##### | 48/95 [00:33<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9436, LAS: 0.8956, UEM: 0.6165, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3159, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6643, loss: 0.7776, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||: 54%|#####3 | 51/95 [00:35<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9439, LAS: 0.8957, UEM: 0.6090, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6701, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.7781, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||: 57%|#####6 | 54/95 [00:37<00:28, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8189, UAS: 0.9428, LAS: 0.8945, UEM: 0.6073, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6892, partial_loss/deprel_loss: 1.0752, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4083, loss: 0.7886, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||: 60%|###### | 57/95 [00:39<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9428, LAS: 0.8944, UEM: 0.5981, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0034, partial_loss/deprel_loss: 0.7920, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0447, loss: 0.7907, batch_reg_loss: 0.2104, reg_loss: 0.2101 ||: 64%|######4 | 61/95 [00:42<00:23, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9423, LAS: 0.8939, UEM: 0.5922, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.4997, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.6782, loss: 0.7958, batch_reg_loss: 0.2104, reg_loss: 0.2101 ||: 68%|######8 | 65/95 [00:44<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9430, LAS: 0.8946, UEM: 0.5994, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.4229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6003, loss: 0.7904, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||: 73%|#######2 | 69/95 [00:47<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9433, LAS: 0.8948, UEM: 0.5953, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6593, partial_loss/deprel_loss: 0.6696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8781, loss: 0.7900, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||: 77%|#######6 | 73/95 [00:50<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9430, LAS: 0.8946, UEM: 0.5979, LEM: 0.3656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8570, partial_loss/deprel_loss: 0.6944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9374, loss: 0.7903, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||: 81%|########1 | 77/95 [00:52<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9436, LAS: 0.8948, UEM: 0.5961, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7054, loss: 0.7883, batch_reg_loss: 0.2106, reg_loss: 0.2102 ||: 86%|########6 | 82/95 [00:55<00:08, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9435, LAS: 0.8946, UEM: 0.5942, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0259, partial_loss/deprel_loss: 0.8515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0970, loss: 0.7897, batch_reg_loss: 0.2106, reg_loss: 0.2102 ||: 91%|######### | 86/95 [00:57<00:05, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9424, LAS: 0.8932, UEM: 0.5910, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2694, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.8006, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||: 95%|#########4| 90/95 [00:59<00:02, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9428, LAS: 0.8936, UEM: 0.5896, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6038, partial_loss/deprel_loss: 0.7466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9288, loss: 0.7983, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||: 99%|#########8| 94/95 [01:01<00:00, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9430, LAS: 0.8937, UEM: 0.5892, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4186, partial_loss/deprel_loss: 0.6067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7798, loss: 0.7981, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "2023-04-07 00:42:09,402 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, 
UAS: 0.9232, LAS: 0.8683, UEM: 0.2793, LEM: 0.0670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8644, partial_loss/deprel_loss: 23.3140, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8241, loss: 25.2268, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9332, LAS: 0.8790, UEM: 0.4771, LEM: 0.2306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0162, partial_loss/deprel_loss: 30.2918, partial_loss/cycle_loss: 0.0000, batch_loss: 24.4367, loss: 19.9516, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:06, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9460, LAS: 0.8955, UEM: 0.6681, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2215, partial_loss/deprel_loss: 6.6622, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3741, loss: 16.2766, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.02it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9493, LAS: 0.8990, UEM: 0.6866, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 10.1514, partial_loss/cycle_loss: 0.0000, batch_loss: 8.1566, loss: 15.0778, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:01, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9473, LAS: 0.8964, UEM: 0.6672, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1476, partial_loss/deprel_loss: 34.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 
27.6170, loss: 16.2177, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02it/s]\n", + "2023-04-07 00:42:20,193 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - reg_loss | 0.210 | 0.000\n", + "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | 0.667\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LEM | 0.349 | 0.406\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - EM | 0.903 | 0.871\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.419 | 1.148\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | 0.947\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.607 | 34.234\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - loss | 0.798 | 16.218\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LAS | 0.894 | 0.896\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:42:20,201 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:42:23,127 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:42:24,821 - INFO - combo.training.trainer - Epoch duration: 0:01:18.082225\n", + "2023-04-07 00:42:24,822 - INFO - combo.training.trainer - Estimated training time remaining: 5:33:57\n", + "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - Epoch 101/399\n", + "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:42:24,830 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9455, LAS: 0.8939, UEM: 0.5151, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6720, partial_loss/deprel_loss: 0.6995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9047, loss: 0.7793, batch_reg_loss: 0.2108, reg_loss: 0.2108 ||: 3%|3 | 3/95 [00:02<01:12, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9327, LAS: 0.8829, UEM: 0.4016, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7709, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9048, loss: 0.8643, 
batch_reg_loss: 0.2108, reg_loss: 0.2108 ||: 7%|7 | 7/95 [00:04<01:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9364, LAS: 0.8876, UEM: 0.4195, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8227, loss: 0.8277, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||: 12%|#1 | 11/95 [00:06<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9379, LAS: 0.8884, UEM: 0.4110, LEM: 0.1858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4987, partial_loss/deprel_loss: 0.5354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7389, loss: 0.8165, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||: 15%|#4 | 14/95 [00:09<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9357, LAS: 0.8852, UEM: 0.4233, LEM: 0.1953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.8442, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||: 19%|#8 | 18/95 [00:11<00:51, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9327, LAS: 0.8823, UEM: 0.3946, LEM: 0.1790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8833, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0098, loss: 0.8695, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||: 22%|##2 | 21/95 [00:13<00:49, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8762, UAS: 0.9345, LAS: 0.8844, UEM: 0.4073, LEM: 0.1858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8482, partial_loss/deprel_loss: 0.7386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9715, loss: 0.8596, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||: 25%|##5 | 24/95 [00:16<00:50, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9341, LAS: 0.8841, UEM: 0.4211, LEM: 0.1965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.3688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.8643, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||: 28%|##8 | 27/95 [00:18<00:50, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9359, LAS: 0.8858, UEM: 0.4352, LEM: 0.2046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.4803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.8506, batch_reg_loss: 0.2111, reg_loss: 0.2109 ||: 32%|###1 | 30/95 [00:20<00:46, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9387, LAS: 0.8888, UEM: 0.4930, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2998, partial_loss/deprel_loss: 0.4433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.8265, batch_reg_loss: 0.2111, reg_loss: 0.2109 ||: 35%|###4 | 33/95 [00:22<00:44, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9402, LAS: 0.8904, UEM: 0.5115, LEM: 0.2644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.4926, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6782, loss: 0.8160, batch_reg_loss: 0.2112, reg_loss: 0.2109 ||: 38%|###7 | 36/95 [00:24<00:43, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9406, LAS: 0.8904, UEM: 0.5123, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9386, partial_loss/deprel_loss: 0.8632, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0895, loss: 0.8178, batch_reg_loss: 0.2112, reg_loss: 0.2110 ||: 41%|####1 | 39/95 [00:27<00:41, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9419, LAS: 0.8919, UEM: 0.5254, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3000, partial_loss/deprel_loss: 0.4581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.8079, batch_reg_loss: 0.2112, reg_loss: 0.2110 ||: 44%|####4 | 42/95 [00:29<00:40, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9404, LAS: 0.8904, UEM: 0.5121, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0808, partial_loss/deprel_loss: 0.8916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1407, loss: 0.8215, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||: 47%|####7 | 45/95 [00:31<00:37, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9407, LAS: 0.8910, UEM: 0.5141, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7744, partial_loss/deprel_loss: 0.7258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9468, loss: 0.8184, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||: 51%|##### | 48/95 [00:33<00:35, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9412, 
LAS: 0.8917, UEM: 0.5137, LEM: 0.2666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7934, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9005, loss: 0.8133, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||: 54%|#####3 | 51/95 [00:36<00:32, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9420, LAS: 0.8925, UEM: 0.5334, LEM: 0.2870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8087, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||: 57%|#####6 | 54/95 [00:38<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9412, LAS: 0.8917, UEM: 0.5325, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3427, partial_loss/deprel_loss: 0.9391, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2313, loss: 0.8169, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||: 60%|###### | 57/95 [00:40<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9424, LAS: 0.8928, UEM: 0.5456, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.3578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.8107, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||: 64%|######4 | 61/95 [00:43<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9427, LAS: 0.8930, UEM: 0.5506, LEM: 0.3031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.8349, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0496, loss: 0.8082, 
batch_reg_loss: 0.2115, reg_loss: 0.2111 ||: 67%|######7 | 64/95 [00:45<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9438, LAS: 0.8942, UEM: 0.5588, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2555, partial_loss/deprel_loss: 0.4168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5961, loss: 0.7995, batch_reg_loss: 0.2115, reg_loss: 0.2111 ||: 72%|#######1 | 68/95 [00:48<00:19, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9438, LAS: 0.8941, UEM: 0.5529, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3956, partial_loss/deprel_loss: 0.5128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7009, loss: 0.8012, batch_reg_loss: 0.2115, reg_loss: 0.2112 ||: 76%|#######5 | 72/95 [00:50<00:15, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9436, LAS: 0.8938, UEM: 0.5466, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4656, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7439, loss: 0.8015, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||: 80%|######## | 76/95 [00:52<00:12, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9447, LAS: 0.8953, UEM: 0.5698, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.3880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5723, loss: 0.7901, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||: 84%|########4 | 80/95 [00:55<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9440, LAS: 
0.8948, UEM: 0.5618, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7325, partial_loss/deprel_loss: 0.6691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.7958, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||: 89%|########9 | 85/95 [00:57<00:06, 1.65it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9434, LAS: 0.8941, UEM: 0.5681, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1874, partial_loss/deprel_loss: 0.3598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5370, loss: 0.8008, batch_reg_loss: 0.2117, reg_loss: 0.2112 ||: 94%|#########3| 89/95 [01:00<00:03, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9432, LAS: 0.8939, UEM: 0.5741, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0500, partial_loss/deprel_loss: 0.8519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1033, loss: 0.8011, batch_reg_loss: 0.2117, reg_loss: 0.2113 ||: 98%|#########7| 93/95 [01:02<00:01, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9430, LAS: 0.8939, UEM: 0.5884, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4152, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2854, loss: 0.8015, batch_reg_loss: 0.2117, reg_loss: 0.2113 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 00:43:30,616 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:43:30,616 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - 
reg_loss | 0.211 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UEM | 0.588 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - LEM | 0.352 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EM | 0.829 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.415 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.988 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - loss | 0.801 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - LAS | 0.894 | N/A\n", + "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:30,618 - INFO - 
combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:30,622 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:43:35,495 - INFO - combo.training.trainer - Epoch duration: 0:01:10.672863\n", + "2023-04-07 00:43:35,495 - INFO - combo.training.trainer - Estimated training time remaining: 5:33:01\n", + "2023-04-07 00:43:35,495 - INFO - allennlp.training.trainer - Epoch 102/399\n", + "2023-04-07 00:43:35,495 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:43:35,496 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:43:35,504 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9521, LAS: 0.9062, UEM: 0.7124, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1537, partial_loss/deprel_loss: 0.3345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 0.6921, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 3%|3 | 3/95 [00:02<01:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9536, LAS: 0.9073, UEM: 0.6696, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5607, partial_loss/deprel_loss: 0.6313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8290, loss: 0.6918, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 6%|6 | 6/95 [00:04<01:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9520, LAS: 0.9068, UEM: 0.6532, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4809, loss: 0.6883, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 9%|9 | 9/95 [00:06<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9549, LAS: 0.9105, UEM: 0.6647, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1886, partial_loss/deprel_loss: 0.3493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5289, loss: 0.6660, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 13%|#2 | 12/95 [00:08<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9532, LAS: 0.9078, UEM: 0.6495, LEM: 0.3949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6674, loss: 0.6793, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 16%|#5 | 15/95 [00:10<00:58, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9506, LAS: 0.9038, UEM: 0.6323, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2353, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.7058, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||: 20%|## | 19/95 [00:13<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9511, LAS: 0.9037, UEM: 0.6248, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3517, partial_loss/deprel_loss: 0.5103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.7073, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||: 24%|##4 | 23/95 [00:16<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9505, LAS: 
0.9030, UEM: 0.6142, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3182, partial_loss/deprel_loss: 0.4879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6657, loss: 0.7166, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||: 27%|##7 | 26/95 [00:18<00:50, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9508, LAS: 0.9032, UEM: 0.6042, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3389, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6532, loss: 0.7163, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||: 31%|### | 29/95 [00:20<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9487, LAS: 0.9009, UEM: 0.5931, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4692, partial_loss/deprel_loss: 0.5537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7485, loss: 0.7315, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||: 34%|###3 | 32/95 [00:23<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9486, LAS: 0.9007, UEM: 0.5894, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.7299, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||: 38%|###7 | 36/95 [00:25<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9455, LAS: 0.8975, UEM: 0.5728, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2140, partial_loss/deprel_loss: 0.8312, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.1194, loss: 0.7540, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||: 42%|####2 | 40/95 [00:28<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9460, LAS: 0.8981, UEM: 0.5713, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0632, partial_loss/deprel_loss: 0.8227, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0824, loss: 0.7558, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 46%|####6 | 44/95 [00:31<00:34, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9459, LAS: 0.8983, UEM: 0.5647, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6393, partial_loss/deprel_loss: 0.5721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.7581, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 51%|##### | 48/95 [00:33<00:31, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9431, LAS: 0.8953, UEM: 0.5522, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8668, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0456, loss: 0.7828, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 55%|#####4 | 52/95 [00:36<00:28, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9428, LAS: 0.8952, UEM: 0.5478, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8932, partial_loss/deprel_loss: 0.7050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9542, loss: 0.7836, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 59%|#####8 | 56/95 [00:38<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9425, LAS: 0.8947, UEM: 0.5395, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7946, partial_loss/deprel_loss: 0.6991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9298, loss: 0.7874, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 63%|######3 | 60/95 [00:41<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9430, LAS: 0.8951, UEM: 0.5460, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1893, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5559, loss: 0.7838, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 66%|######6 | 63/95 [00:44<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9072, UAS: 0.9428, LAS: 0.8948, UEM: 0.5391, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4142, partial_loss/deprel_loss: 0.4686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6693, loss: 0.7874, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 71%|####### | 67/95 [00:46<00:19, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9441, LAS: 0.8964, UEM: 0.5725, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2495, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5878, loss: 0.7745, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||: 74%|#######3 | 70/95 [00:49<00:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9441, LAS: 0.8966, UEM: 0.5679, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6874, partial_loss/deprel_loss: 0.5693, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8045, loss: 0.7731, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||: 78%|#######7 | 74/95 [00:52<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9446, LAS: 0.8970, UEM: 0.5734, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.7715, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||: 82%|########2 | 78/95 [00:54<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9452, LAS: 0.8977, UEM: 0.5832, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1146, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4645, loss: 0.7671, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||: 86%|########6 | 82/95 [00:57<00:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9608, UAS: 0.9459, LAS: 0.8986, UEM: 0.5984, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0602, partial_loss/deprel_loss: 0.1530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3459, loss: 0.7613, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||: 89%|########9 | 85/95 [01:01<00:09, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9454, LAS: 0.8981, UEM: 0.5941, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8619, partial_loss/deprel_loss: 0.7147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9556, loss: 0.7658, batch_reg_loss: 0.2115, reg_loss: 0.2116 ||: 93%|#########2| 88/95 [01:04<00:06, 1.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9458, LAS: 0.8986, UEM: 0.5942, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2808, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.7629, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||: 96%|#########5| 91/95 [01:06<00:03, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9449, LAS: 0.8977, UEM: 0.5913, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2987, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.7685, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||: 100%|##########| 95/95 [01:08<00:00, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9449, LAS: 0.8977, UEM: 0.5913, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2987, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.7685, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||: 100%|##########| 95/95 [01:08<00:00, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - reg_loss | 0.212 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UEM | 0.591 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer 
- LEM | 0.359 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EM | 0.914 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.299 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UAS | 0.945 | N/A\n", + "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.430 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - loss | 0.769 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - LAS | 0.898 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:47,229 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:44:53,279 - INFO - combo.training.trainer - Epoch duration: 0:01:17.783558\n", + "2023-04-07 00:44:53,279 - INFO - combo.training.trainer - Estimated training time remaining: 5:32:25\n", + "2023-04-07 00:44:53,279 - INFO - allennlp.training.trainer - Epoch 103/399\n", + "2023-04-07 00:44:53,279 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:44:53,280 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:44:53,288 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9603, LAS: 0.9123, UEM: 0.6606, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6484, loss: 0.6638, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9543, LAS: 0.9080, UEM: 0.5909, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.6053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8156, loss: 0.6955, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||: 7%|7 | 7/95 [00:04<00:59, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9574, LAS: 0.9098, UEM: 0.6177, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3169, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.6811, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||: 11%|# | 10/95 [00:07<00:59, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9529, LAS: 0.9052, UEM: 0.6078, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0751, partial_loss/deprel_loss: 0.8086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0733, loss: 0.7161, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||: 14%|#3 | 13/95 [00:09<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9530, LAS: 0.9058, UEM: 0.6004, LEM: 0.3327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.4136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.7144, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||: 17%|#6 | 16/95 [00:11<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9515, LAS: 0.9047, UEM: 0.5861, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7027, partial_loss/deprel_loss: 0.6695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8874, loss: 0.7294, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||: 21%|##1 | 20/95 [00:14<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9515, LAS: 0.9044, UEM: 0.5928, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3325, partial_loss/deprel_loss: 0.4349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.7300, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||: 24%|##4 | 23/95 [00:16<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9509, LAS: 0.9040, UEM: 0.5738, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.4292, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6441, loss: 0.7313, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||: 28%|##8 | 27/95 [00:18<00:45, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9473, LAS: 0.9004, UEM: 0.5564, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1648, partial_loss/deprel_loss: 0.7256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0247, loss: 0.7556, batch_reg_loss: 0.2113, reg_loss: 0.2113 ||: 33%|###2 | 31/95 [00:20<00:41, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9468, LAS: 0.8999, UEM: 0.5468, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7834, partial_loss/deprel_loss: 0.6629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8982, loss: 0.7612, batch_reg_loss: 0.2113, reg_loss: 0.2113 ||: 36%|###5 | 34/95 [00:23<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9481, LAS: 0.9013, UEM: 0.5603, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.4270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6104, loss: 0.7508, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 40%|#### | 38/95 [00:25<00:37, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9485, LAS: 0.9018, UEM: 0.5788, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8666, partial_loss/deprel_loss: 0.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9516, loss: 0.7468, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 43%|####3 | 41/95 [00:27<00:36, 1.48it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9472, LAS: 0.9004, UEM: 0.5676, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2658, partial_loss/deprel_loss: 0.4552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6285, loss: 0.7578, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 47%|####7 | 45/95 [00:30<00:32, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9471, LAS: 0.9004, UEM: 0.5813, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1070, partial_loss/deprel_loss: 0.7919, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0661, loss: 0.7578, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 52%|#####1 | 49/95 [00:33<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9476, LAS: 0.9013, UEM: 0.5869, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.7513, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 56%|#####5 | 53/95 [00:35<00:28, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9472, LAS: 0.9009, UEM: 0.5792, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3781, partial_loss/deprel_loss: 0.5024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6887, loss: 0.7536, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||: 60%|###### | 57/95 [00:38<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9458, LAS: 0.8993, UEM: 0.5723, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7209, loss: 0.7673, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||: 64%|######4 | 61/95 [00:41<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9708, UAS: 0.9462, LAS: 0.9001, UEM: 0.5942, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0553, partial_loss/deprel_loss: 0.1266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.7626, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||: 67%|######7 | 64/95 [00:43<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9468, LAS: 0.9008, UEM: 0.5974, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5482, loss: 0.7570, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||: 71%|####### | 67/95 [00:46<00:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9470, LAS: 0.9007, UEM: 0.5963, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1547, partial_loss/deprel_loss: 0.3192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4974, loss: 0.7582, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||: 75%|#######4 | 71/95 [00:48<00:17, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9467, LAS: 0.9004, UEM: 0.5969, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9089, partial_loss/deprel_loss: 0.7662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0058, loss: 0.7609, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||: 78%|#######7 | 74/95 [00:50<00:15, 1.39it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9472, LAS: 0.9008, UEM: 0.6026, LEM: 0.3699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1965, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5303, loss: 0.7568, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||: 81%|########1 | 77/95 [00:52<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9479, LAS: 0.9014, UEM: 0.6057, LEM: 0.3696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6917, loss: 0.7527, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||: 85%|########5 | 81/95 [00:55<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9479, LAS: 0.9015, UEM: 0.6086, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6256, partial_loss/deprel_loss: 0.5794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7997, loss: 0.7518, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 88%|########8 | 84/95 [00:57<00:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9481, LAS: 0.9018, UEM: 0.6058, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.4056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5996, loss: 0.7494, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 92%|#########1| 87/95 [00:59<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9486, LAS: 0.9023, UEM: 0.6125, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6809, loss: 0.7445, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 95%|#########4| 90/95 [01:01<00:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9485, LAS: 0.9022, UEM: 0.6137, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6325, partial_loss/deprel_loss: 0.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8000, loss: 0.7444, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 98%|#########7| 93/95 [01:04<00:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9485, LAS: 0.9021, UEM: 0.6115, LEM: 0.3741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3744, partial_loss/deprel_loss: 0.4893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6773, loss: 0.7451, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-07 00:46:02,149 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - reg_loss | 0.211 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UEM | 0.612 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - LEM | 0.374 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EM | 0.909 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.374 | N/A\n", 
+ "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UAS | 0.948 | N/A\n", + "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.489 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - loss | 0.745 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - LAS | 0.902 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:46:02,156 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:46:07,469 - INFO - combo.training.trainer - Epoch duration: 0:01:14.189764\n", + "2023-04-07 00:46:07,469 - INFO - combo.training.trainer - Estimated training time remaining: 5:31:38\n", + "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - Epoch 104/399\n", + "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:46:07,477 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9486, LAS: 0.9035, UEM: 0.5426, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9259, partial_loss/deprel_loss: 0.6544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9197, loss: 0.7281, batch_reg_loss: 0.2110, reg_loss: 0.2110 ||: 5%|5 | 5/95 [00:02<00:42, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9336, LAS: 0.8878, UEM: 0.4455, LEM: 0.2218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1320, partial_loss/deprel_loss: 0.7576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0434, loss: 0.8465, batch_reg_loss: 0.2109, reg_loss: 0.2110 ||: 9%|9 | 9/95 [00:04<00:45, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9352, LAS: 0.8884, UEM: 0.4043, LEM: 0.1875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7125, partial_loss/deprel_loss: 0.6259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.8350, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||: 14%|#3 | 13/95 
[00:07<00:43, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9405, LAS: 0.8939, UEM: 0.5158, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1708, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.7897, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||: 17%|#6 | 16/95 [00:09<00:50, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9449, LAS: 0.8988, UEM: 0.5457, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2295, partial_loss/deprel_loss: 0.3936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5717, loss: 0.7572, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||: 21%|##1 | 20/95 [00:12<00:46, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9488, LAS: 0.9029, UEM: 0.5981, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3027, partial_loss/deprel_loss: 0.4291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7248, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||: 25%|##5 | 24/95 [00:14<00:43, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9475, LAS: 0.9023, UEM: 0.6085, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7056, partial_loss/deprel_loss: 0.6024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8339, loss: 0.7343, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||: 31%|### | 29/95 [00:16<00:38, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9636, UAS: 0.9477, LAS: 0.9031, UEM: 0.6416, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0509, partial_loss/deprel_loss: 0.1444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3365, loss: 0.7310, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||: 36%|###5 | 34/95 [00:20<00:35, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9469, LAS: 0.9021, UEM: 0.6232, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6437, partial_loss/deprel_loss: 0.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8182, loss: 0.7407, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||: 40%|#### | 38/95 [00:22<00:34, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9484, LAS: 0.9038, UEM: 0.6286, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.7318, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||: 44%|####4 | 42/95 [00:25<00:34, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9474, LAS: 0.9025, UEM: 0.6257, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5362, partial_loss/deprel_loss: 0.9158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2506, loss: 0.7397, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||: 48%|####8 | 46/95 [00:28<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9482, LAS: 0.9034, UEM: 0.6346, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5049, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7595, loss: 0.7305, batch_reg_loss: 0.2107, reg_loss: 0.2109 ||: 52%|#####1 | 49/95 [00:30<00:32, 1.42it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9499, LAS: 0.9054, UEM: 0.6560, LEM: 0.4268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5495, loss: 0.7160, batch_reg_loss: 0.2107, reg_loss: 0.2109 ||: 55%|#####4 | 52/95 [00:33<00:31, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9496, LAS: 0.9051, UEM: 0.6522, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2033, partial_loss/deprel_loss: 0.3288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.7190, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||: 58%|#####7 | 55/95 [00:35<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8153, UAS: 0.9488, LAS: 0.9044, UEM: 0.6488, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7446, partial_loss/deprel_loss: 1.0545, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4032, loss: 0.7245, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||: 62%|######2 | 59/95 [00:38<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9483, LAS: 0.9038, UEM: 0.6402, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.6823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8959, loss: 0.7292, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||: 65%|######5 | 62/95 [00:40<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9486, LAS: 0.9038, UEM: 0.6324, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4369, partial_loss/deprel_loss: 0.5940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7732, loss: 0.7300, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||: 69%|######9 | 66/95 [00:42<00:19, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9483, LAS: 0.9037, UEM: 0.6228, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7550, partial_loss/deprel_loss: 0.6404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 0.7323, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 74%|#######3 | 70/95 [00:45<00:16, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9474, LAS: 0.9025, UEM: 0.6128, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.4898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.7416, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 78%|#######7 | 74/95 [00:47<00:14, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9474, LAS: 0.9026, UEM: 0.6179, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.7409, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 81%|########1 | 77/95 [00:50<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9479, LAS: 0.9032, UEM: 0.6182, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7365, batch_reg_loss: 0.2106, reg_loss: 0.2108 
||: 84%|########4 | 80/95 [00:52<00:11, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9478, LAS: 0.9030, UEM: 0.6133, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5621, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.7377, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 87%|########7 | 83/95 [00:54<00:08, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9480, LAS: 0.9029, UEM: 0.6098, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.6598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8806, loss: 0.7389, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 92%|#########1| 87/95 [00:57<00:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9485, LAS: 0.9037, UEM: 0.6098, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4768, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.7351, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||: 96%|#########5| 91/95 [00:59<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9490, LAS: 0.9040, UEM: 0.6130, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.7312, batch_reg_loss: 0.2105, reg_loss: 0.2108 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9490, LAS: 0.9040, UEM: 0.6130, LEM: 0.3783, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.7312, batch_reg_loss: 0.2105, reg_loss: 0.2108 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - reg_loss | 0.211 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - UEM | 0.613 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - LEM | 0.378 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EM | 0.909 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.388 | N/A\n", + "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - UAS | 0.949 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.453 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - loss | 0.731 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - LAS | 0.904 | N/A\n", + 
"2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:13,063 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:47:18,026 - INFO - combo.training.trainer - Epoch duration: 0:01:10.556335\n", + "2023-04-07 00:47:18,026 - INFO - combo.training.trainer - Estimated training time remaining: 5:30:40\n", + "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - Epoch 105/399\n", + "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:47:18,036 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9570, LAS: 0.9120, UEM: 0.5975, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.6560, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||: 4%|4 | 4/95 [00:02<00:59, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9531, LAS: 0.9077, UEM: 0.5550, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3870, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7089, loss: 0.6960, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||: 8%|8 | 8/95 [00:05<00:55, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9463, LAS: 0.9007, UEM: 0.4835, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8110, partial_loss/deprel_loss: 0.6490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8919, loss: 0.7512, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||: 13%|#2 | 12/95 [00:07<00:53, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9457, LAS: 0.8996, UEM: 0.4813, LEM: 0.2167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5843, partial_loss/deprel_loss: 0.6242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8267, loss: 0.7601, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||: 16%|#5 | 15/95 [00:09<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9465, LAS: 0.9008, UEM: 0.4827, LEM: 0.2172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7159, partial_loss/deprel_loss: 0.5946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.7534, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||: 19%|#8 | 18/95 [00:11<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9498, LAS: 0.9052, UEM: 0.5952, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1832, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.7230, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||: 
22%|##2 | 21/95 [00:14<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9503, LAS: 0.9058, UEM: 0.5896, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.3786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.7190, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||: 25%|##5 | 24/95 [00:16<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9507, LAS: 0.9063, UEM: 0.5772, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4686, partial_loss/deprel_loss: 0.4857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.7133, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||: 29%|##9 | 28/95 [00:18<00:44, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9513, LAS: 0.9068, UEM: 0.5866, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.4758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7079, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||: 33%|###2 | 31/95 [00:20<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9532, LAS: 0.9094, UEM: 0.6135, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2121, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6891, batch_reg_loss: 0.2104, reg_loss: 0.2104 ||: 37%|###6 | 35/95 [00:23<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8089, UAS: 0.9516, LAS: 0.9077, UEM: 0.6169, LEM: 0.3743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7495, partial_loss/deprel_loss: 1.0144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3718, loss: 0.6998, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||: 41%|####1 | 39/95 [00:25<00:35, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9532, LAS: 0.9088, UEM: 0.6282, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2260, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5485, loss: 0.6905, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||: 46%|####6 | 44/95 [00:27<00:29, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9531, LAS: 0.9086, UEM: 0.6165, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5207, partial_loss/deprel_loss: 0.5418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.6937, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||: 52%|#####1 | 49/95 [00:29<00:24, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9533, LAS: 0.9089, UEM: 0.6172, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3151, partial_loss/deprel_loss: 0.4696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6490, loss: 0.6927, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||: 57%|#####6 | 54/95 [00:32<00:22, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9532, LAS: 0.9088, UEM: 0.6171, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7426, partial_loss/deprel_loss: 0.7018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9202, loss: 0.6939, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||: 61%|######1 | 58/95 [00:35<00:21, 
1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8225, UAS: 0.9519, LAS: 0.9073, UEM: 0.6183, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6574, partial_loss/deprel_loss: 0.9583, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3083, loss: 0.7046, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||: 65%|######5 | 62/95 [00:38<00:20, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9515, LAS: 0.9069, UEM: 0.6156, LEM: 0.3664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2118, partial_loss/deprel_loss: 0.3798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.7087, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||: 69%|######9 | 66/95 [00:40<00:17, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9520, LAS: 0.9076, UEM: 0.6303, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1286, partial_loss/deprel_loss: 0.2056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4004, loss: 0.7020, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||: 74%|#######3 | 70/95 [00:43<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9517, LAS: 0.9071, UEM: 0.6325, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6385, loss: 0.7048, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 78%|#######7 | 74/95 [00:47<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9508, LAS: 0.9060, UEM: 0.6239, LEM: 0.3776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4800, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7690, loss: 0.7125, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 82%|########2 | 78/95 [00:49<00:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9497, LAS: 0.9048, UEM: 0.6149, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3706, partial_loss/deprel_loss: 0.5104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 0.7231, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 86%|########6 | 82/95 [00:52<00:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9496, LAS: 0.9047, UEM: 0.6108, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8035, partial_loss/deprel_loss: 0.6049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8548, loss: 0.7240, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 91%|######### | 86/95 [00:54<00:06, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9504, LAS: 0.9054, UEM: 0.6188, LEM: 0.3744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7082, loss: 0.7201, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 95%|#########4| 90/95 [00:58<00:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9502, LAS: 0.9051, UEM: 0.6203, LEM: 0.3784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0376, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0259, loss: 0.7230, 
batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 98%|#########7| 93/95 [01:00<00:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9504, LAS: 0.9055, UEM: 0.6219, LEM: 0.3790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.4989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6951, loss: 0.7205, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 00:48:22,720 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9526, LAS: 0.9053, UEM: 0.7958, LEM: 0.6181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0069, partial_loss/deprel_loss: 28.5755, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0618, loss: 14.0415, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9514, LAS: 0.9038, UEM: 0.6964, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6319, partial_loss/deprel_loss: 14.2944, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5619, loss: 13.0727, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9563, LAS: 0.9079, UEM: 0.7305, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 15.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 12.3029, loss: 12.1444, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:06<00:03, 1.01it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9524, LAS: 0.9031, UEM: 0.7130, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 10.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4927, loss: 13.7313, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.01it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9500, LAS: 0.8992, UEM: 0.6770, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8960, partial_loss/deprel_loss: 21.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 17.4634, loss: 15.1769, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.03it/s]\n", + "2023-04-07 00:48:33,390 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:48:33,390 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - reg_loss | 0.210 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UEM | 0.622 | 0.677\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LEM | 0.379 | 0.416\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EM | 0.912 | 0.890\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.430 | 0.896\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + 
"2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | 0.950\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.499 | 21.605\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - loss | 0.720 | 15.177\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LAS | 0.905 | 0.899\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:48:33,396 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:48:38,203 - INFO - combo.training.trainer - Epoch duration: 0:01:20.176690\n", + "2023-04-07 00:48:38,204 - INFO - combo.training.trainer - Estimated training time remaining: 5:30:08\n", + "2023-04-07 00:48:38,204 - INFO - allennlp.training.trainer - Epoch 106/399\n", + "2023-04-07 00:48:38,204 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:48:38,205 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:48:38,215 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9498, LAS: 0.9024, UEM: 0.4920, LEM: 0.2301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5409, partial_loss/deprel_loss: 0.5081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7247, loss: 0.7104, batch_reg_loss: 0.2101, reg_loss: 0.2101 ||: 3%|3 | 3/95 [00:02<01:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9462, LAS: 0.9003, UEM: 0.5475, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7342, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8453, loss: 0.7253, batch_reg_loss: 0.2100, reg_loss: 0.2101 ||: 6%|6 | 6/95 [00:04<01:09, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9498, LAS: 0.9057, UEM: 0.6378, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1322, partial_loss/deprel_loss: 0.2281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4189, loss: 0.6960, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||: 9%|9 | 9/95 [00:06<01:05, 1.31it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": 
"stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9505, LAS: 0.9063, UEM: 0.6819, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5320, loss: 0.6906, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||: 13%|#2 | 12/95 [00:09<01:03, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9497, LAS: 0.9052, UEM: 0.6633, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.4268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6081, loss: 0.7021, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||: 16%|#5 | 15/95 [00:11<00:58, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9518, LAS: 0.9075, UEM: 0.6630, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.6882, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||: 19%|#8 | 18/95 [00:13<00:58, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9543, LAS: 0.9107, UEM: 0.6664, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5650, loss: 0.6702, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||: 23%|##3 | 22/95 [00:15<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9533, LAS: 0.9099, UEM: 0.6436, LEM: 0.4015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3590, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6474, loss: 0.6792, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||: 27%|##7 | 26/95 [00:18<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9548, LAS: 0.9112, UEM: 0.6559, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2568, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.6713, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||: 31%|### | 29/95 [00:20<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9549, LAS: 0.9112, UEM: 0.6425, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4614, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6885, loss: 0.6705, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||: 34%|###3 | 32/95 [00:22<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9560, LAS: 0.9123, UEM: 0.6523, LEM: 0.4023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.4142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.6607, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||: 38%|###7 | 36/95 [00:24<00:38, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9521, LAS: 0.9079, UEM: 0.6326, LEM: 0.3877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5551, partial_loss/deprel_loss: 0.5666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 0.6933, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||: 42%|####2 | 40/95 [00:26<00:33, 1.62it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9514, LAS: 0.9071, UEM: 0.6180, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2428, partial_loss/deprel_loss: 0.4172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.6998, batch_reg_loss: 0.2098, reg_loss: 0.2100 ||: 47%|####7 | 45/95 [00:29<00:28, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9517, LAS: 0.9073, UEM: 0.6297, LEM: 0.3848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1789, partial_loss/deprel_loss: 0.3202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.6986, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||: 52%|#####1 | 49/95 [00:31<00:25, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9510, LAS: 0.9064, UEM: 0.6171, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7447, partial_loss/deprel_loss: 0.7049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9226, loss: 0.7078, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||: 56%|#####5 | 53/95 [00:33<00:23, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9518, LAS: 0.9075, UEM: 0.6210, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7524, loss: 0.7021, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||: 60%|###### | 57/95 [00:36<00:23, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9513, LAS: 0.9070, UEM: 0.6121, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3028, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6319, loss: 0.7062, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||: 64%|######4 | 61/95 [00:38<00:20, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9509, LAS: 0.9065, UEM: 0.6052, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6779, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8502, loss: 0.7111, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 68%|######8 | 65/95 [00:41<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9506, LAS: 0.9060, UEM: 0.6054, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3979, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.7159, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 73%|#######2 | 69/95 [00:44<00:16, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9499, LAS: 0.9054, UEM: 0.6007, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.7208, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 77%|#######6 | 73/95 [00:46<00:13, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9501, LAS: 0.9055, UEM: 0.5959, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3291, partial_loss/deprel_loss: 0.4398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.7204, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 81%|########1 | 77/95 [00:49<00:11, 1.55it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9508, LAS: 0.9062, UEM: 0.6101, LEM: 0.3644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0923, partial_loss/deprel_loss: 0.2688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.7151, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 85%|########5 | 81/95 [00:52<00:09, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9513, LAS: 0.9068, UEM: 0.6119, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5942, loss: 0.7124, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||: 88%|########8 | 84/95 [00:55<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9515, LAS: 0.9071, UEM: 0.6116, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9652, loss: 0.7113, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 93%|#########2| 88/95 [00:57<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9511, LAS: 0.9067, UEM: 0.6071, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4269, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.7147, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 97%|#########6| 92/95 [01:00<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9516, LAS: 0.9075, UEM: 0.6207, LEM: 0.3808, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7087, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 100%|##########| 95/95 [01:02<00:00, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9516, LAS: 0.9075, UEM: 0.6207, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7087, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:49:43,998 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - reg_loss | 0.210 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UEM | 0.621 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - LEM | 0.381 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EM | 0.917 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.449 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UAS | 0.952 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.418 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - loss | 0.709 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - LAS | 0.908 | N/A\n", + "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:44,005 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:49:48,752 - INFO - combo.training.trainer - Epoch duration: 0:01:10.547947\n", + "2023-04-07 00:49:48,752 - INFO - combo.training.trainer - Estimated training time remaining: 5:29:10\n", + "2023-04-07 00:49:48,752 - INFO - allennlp.training.trainer - Epoch 107/399\n", + "2023-04-07 00:49:48,753 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:49:48,753 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:49:48,763 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9279, LAS: 0.8832, UEM: 0.2030, LEM: 0.0752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7221, partial_loss/deprel_loss: 0.6773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8958, loss: 0.9065, batch_reg_loss: 0.2096, reg_loss: 0.2096 ||: 3%|3 | 3/95 [00:02<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9411, LAS: 0.8992, UEM: 0.6315, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5848, loss: 0.7685, batch_reg_loss: 0.2096, reg_loss: 0.2096 ||: 6%|6 | 6/95 [00:04<01:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9444, LAS: 0.9015, UEM: 0.6124, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.4668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6510, loss: 0.7529, batch_reg_loss: 0.2095, reg_loss: 0.2096 ||: 11%|# | 10/95 [00:06<00:56, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9440, LAS: 0.9006, UEM: 0.6267, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5338, loss: 0.7550, batch_reg_loss: 0.2095, reg_loss: 0.2096 ||: 14%|#3 | 13/95 [00:09<01:00, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9447, LAS: 0.9009, UEM: 0.6051, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3996, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6789, loss: 0.7548, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||: 18%|#7 | 17/95 [00:12<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9475, LAS: 0.9039, UEM: 0.6153, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.4225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6152, loss: 0.7260, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||: 21%|##1 | 20/95 [00:14<00:53, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9497, LAS: 0.9067, UEM: 0.6197, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.7098, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||: 24%|##4 | 23/95 [00:16<00:51, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9518, LAS: 0.9089, UEM: 0.6527, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4767, loss: 0.6938, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||: 27%|##7 | 26/95 [00:18<00:51, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9525, LAS: 0.9096, UEM: 0.6346, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.4881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.6928, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||: 32%|###1 | 30/95 [00:21<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9512, LAS: 0.9084, UEM: 0.6289, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7776, partial_loss/deprel_loss: 0.6976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9230, loss: 0.7011, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||: 35%|###4 | 33/95 [00:23<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8602, UAS: 0.9497, LAS: 0.9069, UEM: 0.6102, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1460, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.7117, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||: 39%|###8 | 37/95 [00:26<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9505, LAS: 0.9075, UEM: 0.6062, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5865, loss: 0.7071, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||: 42%|####2 | 40/95 [00:28<00:38, 1.44it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9510, LAS: 0.9079, UEM: 0.6074, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6283, loss: 0.7037, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||: 46%|####6 | 44/95 [00:30<00:33, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9505, LAS: 0.9074, UEM: 0.6036, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7993, partial_loss/deprel_loss: 0.6920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9228, loss: 0.7085, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||: 51%|##### | 48/95 [00:32<00:29, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9510, LAS: 0.9079, UEM: 0.6014, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4517, partial_loss/deprel_loss: 0.5461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7366, loss: 0.7052, batch_reg_loss: 0.2093, reg_loss: 0.2095 ||: 55%|#####4 | 52/95 [00:34<00:25, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9512, LAS: 0.9079, UEM: 0.5973, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4527, partial_loss/deprel_loss: 0.5273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7217, loss: 0.7043, batch_reg_loss: 0.2093, reg_loss: 0.2095 ||: 60%|###### | 57/95 [00:37<00:21, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9517, LAS: 0.9084, UEM: 0.6008, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2877, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.7005, batch_reg_loss: 0.2093, reg_loss: 0.2094 ||: 65%|######5 | 62/95 [00:39<00:17, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9507, LAS: 0.9072, UEM: 0.5863, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5253, partial_loss/deprel_loss: 0.5571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7600, loss: 0.7086, batch_reg_loss: 0.2093, reg_loss: 0.2094 ||: 71%|####### | 67/95 [00:41<00:13, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9510, LAS: 0.9074, UEM: 0.5902, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3831, partial_loss/deprel_loss: 0.4447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.7070, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||: 76%|#######5 | 72/95 [00:45<00:13, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9507, LAS: 0.9074, UEM: 0.6074, LEM: 0.3759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.4206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.7075, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||: 80%|######## | 76/95 [00:48<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9512, LAS: 0.9079, UEM: 0.6104, LEM: 0.3769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3422, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6485, loss: 0.7034, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||: 84%|########4 | 80/95 [00:51<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9517, LAS: 0.9086, UEM: 0.6212, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1150, partial_loss/deprel_loss: 0.2780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.6978, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||: 88%|########8 | 84/95 [00:53<00:06, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.9509, LAS: 0.9077, UEM: 0.6160, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6555, partial_loss/deprel_loss: 0.9330, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2867, loss: 0.7047, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||: 93%|#########2| 88/95 [00:56<00:04, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9509, LAS: 0.9076, UEM: 0.6166, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5582, partial_loss/deprel_loss: 0.5507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.7061, batch_reg_loss: 0.2091, reg_loss: 0.2094 ||: 97%|#########6| 92/95 [00:59<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9514, LAS: 0.9081, UEM: 0.6205, LEM: 0.3876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4833, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7664, loss: 0.7025, batch_reg_loss: 0.2091, reg_loss: 0.2094 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:50:52,802 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer 
- patience | 5.000 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - reg_loss | 0.209 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UEM | 0.621 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - LEM | 0.388 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EM | 0.904 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.483 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UAS | 0.951 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.576 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - loss | 0.702 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - LAS | 0.908 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - 
combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:52,809 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:50:58,225 - INFO - combo.training.trainer - Epoch duration: 0:01:09.472212\n", + "2023-04-07 00:50:58,225 - INFO - combo.training.trainer - Estimated training time remaining: 5:28:08\n", + "2023-04-07 00:50:58,226 - INFO - allennlp.training.trainer - Epoch 108/399\n", + "2023-04-07 00:50:58,226 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:50:58,227 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:50:58,237 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9554, LAS: 0.9106, UEM: 0.5932, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1861, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5072, loss: 0.7211, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||: 3%|3 | 3/95 [00:02<01:11, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8598, UAS: 0.9537, LAS: 0.9107, UEM: 0.7085, LEM: 0.4866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1022, partial_loss/deprel_loss: 0.7836, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0564, loss: 0.7066, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||: 7%|7 | 7/95 [00:04<01:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9580, LAS: 0.9153, UEM: 0.7221, LEM: 0.4892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.6625, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||: 11%|# | 10/95 [00:07<01:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9570, LAS: 0.9129, UEM: 0.6728, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.4736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6552, loss: 0.6820, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||: 15%|#4 | 14/95 [00:09<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9569, LAS: 0.9138, UEM: 0.6635, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6611, loss: 0.6735, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||: 19%|#8 | 18/95 [00:12<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9581, LAS: 0.9150, UEM: 0.6645, LEM: 0.4206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 0.6635, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||: 22%|##2 | 21/95 [00:14<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9588, LAS: 0.9162, UEM: 0.6591, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.6562, batch_reg_loss: 0.2090, reg_loss: 0.2090 ||: 26%|##6 | 25/95 [00:17<00:49, 1.43it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9580, LAS: 0.9155, UEM: 0.6468, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7635, partial_loss/deprel_loss: 0.6478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8799, loss: 0.6586, batch_reg_loss: 0.2090, reg_loss: 0.2090 ||: 31%|### | 29/95 [00:19<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9563, LAS: 0.9135, UEM: 0.6265, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7999, partial_loss/deprel_loss: 0.6219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8664, loss: 0.6706, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||: 34%|###3 | 32/95 [00:21<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9566, LAS: 0.9138, UEM: 0.6330, LEM: 0.3886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.4875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7165, loss: 0.6644, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||: 37%|###6 | 35/95 [00:24<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9557, LAS: 0.9128, UEM: 0.6217, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8190, partial_loss/deprel_loss: 0.6872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9225, loss: 0.6715, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||: 41%|####1 | 39/95 [00:26<00:38, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9537, LAS: 0.9106, UEM: 0.6048, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5283, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7432, loss: 0.6887, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||: 45%|####5 | 43/95 [00:29<00:33, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9538, LAS: 0.9108, UEM: 0.6031, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5701, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.6881, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||: 49%|####9 | 47/95 [00:31<00:31, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9543, LAS: 0.9113, UEM: 0.6065, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4044, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6556, loss: 0.6834, batch_reg_loss: 0.2088, reg_loss: 0.2090 ||: 54%|#####3 | 51/95 [00:34<00:29, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9541, LAS: 0.9109, UEM: 0.6083, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1321, partial_loss/deprel_loss: 0.7378, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0255, loss: 0.6860, batch_reg_loss: 0.2088, reg_loss: 0.2090 ||: 58%|#####7 | 55/95 [00:37<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9532, LAS: 0.9099, UEM: 0.6028, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5912, loss: 0.6913, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||: 62%|######2 | 59/95 
[00:39<00:24, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9522, LAS: 0.9089, UEM: 0.5919, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5001, partial_loss/deprel_loss: 0.5308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.6973, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||: 66%|######6 | 63/95 [00:42<00:21, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9524, LAS: 0.9093, UEM: 0.6102, LEM: 0.3798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5797, partial_loss/deprel_loss: 0.6738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8638, loss: 0.6955, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||: 71%|####### | 67/95 [00:45<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9510, LAS: 0.9080, UEM: 0.6014, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4449, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6341, loss: 0.7026, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||: 75%|#######4 | 71/95 [00:47<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9517, LAS: 0.9088, UEM: 0.6074, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3527, partial_loss/deprel_loss: 0.3824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5852, loss: 0.6971, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||: 80%|######## | 76/95 [00:50<00:11, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9527, LAS: 0.9099, UEM: 0.6241, LEM: 0.3919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2745, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.6882, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||: 84%|########4 | 80/95 [00:52<00:08, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9521, LAS: 0.9091, UEM: 0.6147, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6618, partial_loss/deprel_loss: 0.6279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.6943, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||: 89%|########9 | 85/95 [00:54<00:05, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9519, LAS: 0.9088, UEM: 0.6121, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6193, partial_loss/deprel_loss: 0.6511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8534, loss: 0.6958, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||: 94%|#########3| 89/95 [00:56<00:03, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9526, LAS: 0.9094, UEM: 0.6191, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3453, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.6909, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||: 98%|#########7| 93/95 [00:59<00:01, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9523, LAS: 0.9091, UEM: 0.6216, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1122, partial_loss/deprel_loss: 0.2778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4534, loss: 0.6928, batch_reg_loss: 0.2086, reg_loss: 0.2089 ||: 100%|##########| 
95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer - reg_loss | 0.209 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UEM | 0.622 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - LEM | 0.389 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EM | 0.940 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.112 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UAS | 0.952 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.278 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - loss | 0.693 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - LAS | 0.909 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:52:02,858 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:52:02,863 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:52:07,709 - INFO - combo.training.trainer - Epoch duration: 0:01:09.483094\n", + "2023-04-07 00:52:07,709 - INFO - combo.training.trainer - Estimated training time remaining: 5:27:06\n", + "2023-04-07 00:52:07,709 - INFO - allennlp.training.trainer - Epoch 109/399\n", + "2023-04-07 00:52:07,709 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:52:07,710 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:52:07,717 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9737, LAS: 0.9335, UEM: 0.8213, LEM: 0.5670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.4883, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||: 3%|3 | 3/95 [00:02<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9638, LAS: 0.9217, UEM: 0.7067, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3636, partial_loss/deprel_loss: 0.4693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.6022, batch_reg_loss: 0.2086, reg_loss: 
0.2086 ||: 7%|7 | 7/95 [00:04<01:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9561, LAS: 0.9129, UEM: 0.6724, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.5999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7991, loss: 0.6619, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||: 11%|# | 10/95 [00:06<00:59, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9543, LAS: 0.9103, UEM: 0.6235, LEM: 0.3683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3306, partial_loss/deprel_loss: 0.5062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.6850, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||: 15%|#4 | 14/95 [00:09<00:54, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9574, LAS: 0.9142, UEM: 0.6780, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1156, partial_loss/deprel_loss: 0.2067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3970, loss: 0.6520, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 18%|#7 | 17/95 [00:11<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9594, LAS: 0.9161, UEM: 0.6983, LEM: 0.4522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2219, partial_loss/deprel_loss: 0.4078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.6379, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 21%|##1 | 20/95 [00:13<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9587, LAS: 0.9145, UEM: 0.6847, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5254, partial_loss/deprel_loss: 0.5624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7635, loss: 0.6516, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 24%|##4 | 23/95 [00:16<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9586, LAS: 0.9149, UEM: 0.6768, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.4095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6073, loss: 0.6530, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 27%|##7 | 26/95 [00:18<00:51, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9536, LAS: 0.9092, UEM: 0.6545, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.6837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9414, loss: 0.6911, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 31%|### | 29/95 [00:20<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9550, LAS: 0.9107, UEM: 0.6705, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4781, partial_loss/deprel_loss: 0.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.6806, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||: 34%|###3 | 32/95 [00:22<00:46, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9550, LAS: 0.9108, UEM: 0.6640, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.6793, batch_reg_loss: 0.2085, reg_loss: 0.2085 ||: 37%|###6 | 35/95 [00:25<00:44, 
1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9554, LAS: 0.9116, UEM: 0.6613, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1922, partial_loss/deprel_loss: 0.2809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4716, loss: 0.6733, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 40%|#### | 38/95 [00:27<00:42, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9545, LAS: 0.9108, UEM: 0.6472, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7462, loss: 0.6796, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 43%|####3 | 41/95 [00:29<00:40, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9557, LAS: 0.9123, UEM: 0.6722, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3647, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6505, loss: 0.6698, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 46%|####6 | 44/95 [00:32<00:39, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9557, LAS: 0.9123, UEM: 0.6712, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3744, partial_loss/deprel_loss: 0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6922, loss: 0.6716, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 51%|##### | 48/95 [00:34<00:34, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9554, LAS: 0.9121, UEM: 0.6678, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8979, partial_loss/deprel_loss: 0.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9726, loss: 0.6757, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 54%|#####3 | 51/95 [00:36<00:32, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9561, LAS: 0.9128, UEM: 0.6685, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2373, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5406, loss: 0.6699, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||: 57%|#####6 | 54/95 [00:39<00:31, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9567, LAS: 0.9137, UEM: 0.6687, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2389, partial_loss/deprel_loss: 0.3803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.6649, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||: 61%|######1 | 58/95 [00:42<00:27, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9560, LAS: 0.9128, UEM: 0.6614, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5460, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8166, loss: 0.6726, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||: 64%|######4 | 61/95 [00:44<00:24, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9563, LAS: 0.9133, UEM: 0.6652, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1201, partial_loss/deprel_loss: 0.2667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.6687, batch_reg_loss: 0.2083, 
reg_loss: 0.2085 ||: 67%|######7 | 64/95 [00:46<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9556, LAS: 0.9127, UEM: 0.6565, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7757, partial_loss/deprel_loss: 0.6345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 0.6739, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||: 72%|#######1 | 68/95 [00:49<00:19, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9551, LAS: 0.9123, UEM: 0.6508, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6654, loss: 0.6765, batch_reg_loss: 0.2083, reg_loss: 0.2084 ||: 76%|#######5 | 72/95 [00:51<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9544, LAS: 0.9115, UEM: 0.6458, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4878, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6566, loss: 0.6817, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 80%|######## | 76/95 [00:54<00:12, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9547, LAS: 0.9119, UEM: 0.6430, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5226, partial_loss/deprel_loss: 0.5032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7153, loss: 0.6791, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 84%|########4 | 80/95 [00:56<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9538, LAS: 0.9108, UEM: 0.6404, LEM: 
0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.3280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4967, loss: 0.6843, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 88%|########8 | 84/95 [00:59<00:07, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9537, LAS: 0.9106, UEM: 0.6383, LEM: 0.4030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5488, partial_loss/deprel_loss: 0.5528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.6862, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 93%|#########2| 88/95 [01:01<00:04, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9532, LAS: 0.9100, UEM: 0.6286, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7232, partial_loss/deprel_loss: 0.5868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8223, loss: 0.6904, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 98%|#########7| 93/95 [01:03<00:01, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9532, LAS: 0.9100, UEM: 0.6285, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1779, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5553, loss: 0.6906, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - reg_loss | 0.208 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - 
EUAS | 0.000 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - UEM | 0.629 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - LEM | 0.393 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - EM | 0.933 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.178 | N/A\n", + "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - UAS | 0.953 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.389 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - loss | 0.691 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - LAS | 0.910 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:53:15,575 - INFO - 
allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:53:20,146 - INFO - combo.training.trainer - Epoch duration: 0:01:12.436840\n", + "2023-04-07 00:53:20,147 - INFO - combo.training.trainer - Estimated training time remaining: 5:26:12\n", + "2023-04-07 00:53:20,147 - INFO - allennlp.training.trainer - Epoch 110/399\n", + "2023-04-07 00:53:20,147 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:53:20,148 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:53:20,156 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9701, LAS: 0.9316, UEM: 0.8100, LEM: 0.6100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1711, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5030, loss: 0.5320, batch_reg_loss: 0.2082, reg_loss: 0.2082 ||: 4%|4 | 4/95 [00:02<00:47, 1.92it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9519, LAS: 0.9116, UEM: 0.6588, LEM: 0.4655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4492, partial_loss/deprel_loss: 0.4790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.6690, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||: 9%|9 | 9/95 [00:04<00:42, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8418, UAS: 0.9484, LAS: 0.9073, UEM: 0.6214, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3577, partial_loss/deprel_loss: 0.7750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0997, loss: 
0.6918, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||: 14%|#3 | 13/95 [00:06<00:43, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9496, LAS: 0.9090, UEM: 0.6142, LEM: 0.4085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4898, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6281, loss: 0.6798, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||: 18%|#7 | 17/95 [00:09<00:43, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9502, LAS: 0.9097, UEM: 0.6272, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1815, partial_loss/deprel_loss: 0.3025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4864, loss: 0.6779, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||: 22%|##2 | 21/95 [00:11<00:42, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9501, LAS: 0.9099, UEM: 0.6164, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5556, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7572, loss: 0.6785, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||: 26%|##6 | 25/95 [00:14<00:40, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9503, LAS: 0.9097, UEM: 0.6350, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1782, partial_loss/deprel_loss: 0.8499, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1236, loss: 0.6830, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||: 29%|##9 | 28/95 [00:16<00:41, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9508, LAS: 0.9102, UEM: 0.6442, 
LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6302, partial_loss/deprel_loss: 0.6189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.6801, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||: 33%|###2 | 31/95 [00:18<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9524, LAS: 0.9118, UEM: 0.6488, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2152, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.6697, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||: 36%|###5 | 34/95 [00:21<00:45, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9520, LAS: 0.9110, UEM: 0.6294, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.6780, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||: 40%|#### | 38/95 [00:23<00:40, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9528, LAS: 0.9117, UEM: 0.6301, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.6748, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||: 43%|####3 | 41/95 [00:26<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9522, LAS: 0.9110, UEM: 0.6249, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5574, loss: 0.6809, batch_reg_loss: 0.2080, reg_loss: 
0.2081 ||: 46%|####6 | 44/95 [00:28<00:37, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9524, LAS: 0.9111, UEM: 0.6271, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7328, partial_loss/deprel_loss: 0.6320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8601, loss: 0.6801, batch_reg_loss: 0.2079, reg_loss: 0.2081 ||: 49%|####9 | 47/95 [00:30<00:34, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9531, LAS: 0.9117, UEM: 0.6350, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2185, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.6734, batch_reg_loss: 0.2079, reg_loss: 0.2081 ||: 53%|#####2 | 50/95 [00:32<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9525, LAS: 0.9113, UEM: 0.6358, LEM: 0.4071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5059, partial_loss/deprel_loss: 0.8047, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1528, loss: 0.6778, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||: 56%|#####5 | 53/95 [00:35<00:30, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9525, LAS: 0.9112, UEM: 0.6277, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5079, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.6800, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||: 60%|###### | 57/95 [00:37<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9517, LAS: 0.9103, UEM: 0.6262, LEM: 0.3972, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7173, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.6859, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||: 63%|######3 | 60/95 [00:39<00:24, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9513, LAS: 0.9099, UEM: 0.6200, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0373, partial_loss/deprel_loss: 0.7337, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0023, loss: 0.6889, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||: 67%|######7 | 64/95 [00:42<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9521, LAS: 0.9109, UEM: 0.6394, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4713, partial_loss/deprel_loss: 0.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6910, loss: 0.6820, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||: 71%|####### | 67/95 [00:44<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9529, LAS: 0.9116, UEM: 0.6413, LEM: 0.4155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4729, partial_loss/deprel_loss: 0.5493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7419, loss: 0.6771, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||: 75%|#######4 | 71/95 [00:47<00:16, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9530, LAS: 0.9115, UEM: 0.6350, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6252, loss: 0.6786, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||: 79%|#######8 | 75/95 [00:49<00:13, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9535, LAS: 0.9119, UEM: 0.6321, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2951, partial_loss/deprel_loss: 0.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.6769, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||: 83%|########3 | 79/95 [00:52<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9541, LAS: 0.9124, UEM: 0.6400, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4562, partial_loss/deprel_loss: 0.5250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.6728, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||: 86%|########6 | 82/95 [00:54<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9545, LAS: 0.9130, UEM: 0.6445, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2685, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5305, loss: 0.6686, batch_reg_loss: 0.2077, reg_loss: 0.2080 ||: 89%|########9 | 85/95 [00:56<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9535, LAS: 0.9119, UEM: 0.6368, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0026, partial_loss/deprel_loss: 0.7095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9758, loss: 0.6767, batch_reg_loss: 0.2077, reg_loss: 0.2080 ||: 93%|#########2| 88/95 [00:59<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9255, UAS: 0.9535, LAS: 0.9118, UEM: 0.6334, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.4044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5876, loss: 0.6783, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||: 97%|#########6| 92/95 [01:01<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9531, LAS: 0.9113, UEM: 0.6284, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6236, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8093, loss: 0.6821, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||: 100%|##########| 95/95 [01:03<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9531, LAS: 0.9113, UEM: 0.6284, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6236, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8093, loss: 0.6821, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 00:54:27,132 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9344, LAS: 0.8765, UEM: 0.4206, LEM: 0.1262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4799, partial_loss/deprel_loss: 34.4669, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8695, loss: 18.9120, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9525, LAS: 0.9021, UEM: 0.6547, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1809, partial_loss/deprel_loss: 8.1429, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5505, loss: 13.7622, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.02s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9503, LAS: 0.9009, UEM: 0.6862, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 6.0463, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8789, loss: 14.6505, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:08<00:03, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9518, LAS: 0.9015, UEM: 0.6800, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 9.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5400, loss: 13.5045, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9518, LAS: 0.9015, UEM: 0.6800, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 9.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5400, loss: 13.5045, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.03it/s]\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - reg_loss | 0.208 | 0.000\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:54:37,859 - INFO 
- combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - UEM | 0.628 | 0.680\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - LEM | 0.395 | 0.416\n", + "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - EM | 0.900 | 0.921\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.624 | 0.408\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - UAS | 0.953 | 0.952\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.596 | 9.323\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - loss | 0.682 | 13.504\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - LAS | 0.911 | 0.901\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:54:37,865 - INFO - allennlp.training.checkpointer - Best validation 
performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:54:43,239 - INFO - combo.training.trainer - Epoch duration: 0:01:23.092109\n", + "2023-04-07 00:54:43,239 - INFO - combo.training.trainer - Estimated training time remaining: 5:25:45\n", + "2023-04-07 00:54:43,240 - INFO - allennlp.training.trainer - Epoch 111/399\n", + "2023-04-07 00:54:43,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:54:43,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:54:43,251 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9590, LAS: 0.9166, UEM: 0.6606, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5436, partial_loss/deprel_loss: 0.5115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7256, loss: 0.6280, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||: 5%|5 | 5/95 [00:02<00:39, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9373, LAS: 0.8936, UEM: 0.5443, LEM: 0.3220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8212, loss: 0.7938, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||: 9%|9 | 9/95 [00:04<00:42, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9437, LAS: 0.9003, UEM: 0.6005, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1950, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5739, loss: 0.7501, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||: 
13%|#2 | 12/95 [00:06<00:45, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9476, LAS: 0.9040, UEM: 0.6031, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2522, partial_loss/deprel_loss: 0.4405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6105, loss: 0.7300, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||: 17%|#6 | 16/95 [00:09<00:44, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9514, LAS: 0.9084, UEM: 0.6514, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5003, loss: 0.6952, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||: 20%|## | 19/95 [00:11<00:47, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9505, LAS: 0.9072, UEM: 0.6217, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5095, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7701, loss: 0.7075, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||: 23%|##3 | 22/95 [00:13<00:48, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9532, LAS: 0.9101, UEM: 0.6547, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1771, partial_loss/deprel_loss: 0.3581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5295, loss: 0.6859, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||: 26%|##6 | 25/95 [00:15<00:46, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9536, LAS: 0.9108, UEM: 0.6392, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7453, loss: 0.6827, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||: 31%|### | 29/95 [00:18<00:42, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9540, LAS: 0.9114, UEM: 0.6238, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.6796, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||: 35%|###4 | 33/95 [00:20<00:38, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9668, UAS: 0.9550, LAS: 0.9132, UEM: 0.6617, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0337, partial_loss/deprel_loss: 0.1306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3188, loss: 0.6679, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 39%|###8 | 37/95 [00:24<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9540, LAS: 0.9120, UEM: 0.6489, LEM: 0.4159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9585, partial_loss/deprel_loss: 0.6945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9548, loss: 0.6778, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 43%|####3 | 41/95 [00:26<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9540, LAS: 0.9122, UEM: 0.6452, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4219, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.6761, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 46%|####6 | 44/95 [00:28<00:36, 1.40it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9541, LAS: 0.9121, UEM: 0.6530, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3005, partial_loss/deprel_loss: 0.4328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6782, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 49%|####9 | 47/95 [00:31<00:35, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9541, LAS: 0.9122, UEM: 0.6494, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 0.3303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.6784, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 53%|#####2 | 50/95 [00:33<00:33, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9547, LAS: 0.9127, UEM: 0.6445, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3559, partial_loss/deprel_loss: 0.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.6742, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||: 57%|#####6 | 54/95 [00:36<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9557, LAS: 0.9136, UEM: 0.6559, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2399, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5708, loss: 0.6671, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||: 60%|###### | 57/95 [00:38<00:28, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9552, LAS: 0.9130, UEM: 0.6515, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2354, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5534, loss: 0.6727, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||: 64%|######4 | 61/95 [00:41<00:24, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9553, LAS: 0.9132, UEM: 0.6486, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2017, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5252, loss: 0.6709, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||: 68%|######8 | 65/95 [00:43<00:20, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9549, LAS: 0.9127, UEM: 0.6378, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.4096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.6746, batch_reg_loss: 0.2074, reg_loss: 0.2075 ||: 73%|#######2 | 69/95 [00:46<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9554, LAS: 0.9134, UEM: 0.6394, LEM: 0.3992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4656, partial_loss/deprel_loss: 0.5376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.6704, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 77%|#######6 | 73/95 [00:49<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9559, LAS: 0.9139, UEM: 0.6483, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.6655, batch_reg_loss: 
0.2073, reg_loss: 0.2075 ||: 81%|########1 | 77/95 [00:51<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9549, LAS: 0.9128, UEM: 0.6375, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7371, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.6732, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 85%|########5 | 81/95 [00:54<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9552, LAS: 0.9131, UEM: 0.6416, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.6706, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 88%|########8 | 84/95 [00:56<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9546, LAS: 0.9124, UEM: 0.6412, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.3788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5501, loss: 0.6747, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 93%|#########2| 88/95 [00:58<00:04, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9546, LAS: 0.9125, UEM: 0.6358, LEM: 0.3966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5872, loss: 0.6744, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 97%|#########6| 92/95 [01:01<00:01, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9548, LAS: 0.9128, UEM: 
0.6377, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2456, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5708, loss: 0.6717, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 00:55:49,824 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - reg_loss | 0.207 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UEM | 0.638 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - LEM | 0.398 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.246 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.393 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - loss | 0.672 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - LAS | 0.913 
| N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:55:49,830 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:55:54,628 - INFO - combo.training.trainer - Epoch duration: 0:01:11.388004\n", + "2023-04-07 00:55:54,628 - INFO - combo.training.trainer - Estimated training time remaining: 5:24:47\n", + "2023-04-07 00:55:54,628 - INFO - allennlp.training.trainer - Epoch 112/399\n", + "2023-04-07 00:55:54,629 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:55:54,629 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:55:54,638 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9541, LAS: 0.9113, UEM: 0.6700, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.6850, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||: 3%|3 | 3/95 [00:02<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9573, LAS: 0.9152, UEM: 0.6773, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1977, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.6647, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||: 6%|6 | 6/95 [00:04<01:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9541, LAS: 0.9116, UEM: 0.6053, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0969, partial_loss/deprel_loss: 0.7053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9908, loss: 0.6865, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||: 12%|#1 | 11/95 [00:06<00:54, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9544, LAS: 0.9121, UEM: 0.6304, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2483, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5873, loss: 0.6820, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||: 16%|#5 | 15/95 [00:08<00:49, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9508, LAS: 0.9085, UEM: 0.5879, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5111, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1616, loss: 0.7109, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||: 21%|##1 | 20/95 [00:11<00:43, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9532, LAS: 0.9110, UEM: 0.5929, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3499, partial_loss/deprel_loss: 0.4477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6353, loss: 0.6941, batch_reg_loss: 0.2071, reg_loss: 
0.2072 ||: 26%|##6 | 25/95 [00:13<00:38, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9550, LAS: 0.9132, UEM: 0.6118, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2080, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.6762, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||: 31%|### | 29/95 [00:16<00:38, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9534, LAS: 0.9113, UEM: 0.6007, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7130, loss: 0.6886, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||: 35%|###4 | 33/95 [00:19<00:38, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9525, LAS: 0.9106, UEM: 0.5940, LEM: 0.3442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7082, loss: 0.6925, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||: 39%|###8 | 37/95 [00:21<00:36, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9515, LAS: 0.9096, UEM: 0.5879, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5804, partial_loss/deprel_loss: 0.5401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7552, loss: 0.6975, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||: 43%|####3 | 41/95 [00:24<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9521, LAS: 0.9104, UEM: 0.5935, LEM: 0.3457, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8963, partial_loss/deprel_loss: 0.6886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9372, loss: 0.6926, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||: 47%|####7 | 45/95 [00:27<00:32, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9509, LAS: 0.9092, UEM: 0.5827, LEM: 0.3359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4573, partial_loss/deprel_loss: 0.5203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.7012, batch_reg_loss: 0.2071, reg_loss: 0.2071 ||: 52%|#####1 | 49/95 [00:29<00:29, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9512, LAS: 0.9096, UEM: 0.5857, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7286, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8670, loss: 0.6983, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||: 56%|#####5 | 53/95 [00:32<00:27, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9525, LAS: 0.9110, UEM: 0.5959, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1759, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.6898, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||: 60%|###### | 57/95 [00:35<00:25, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9532, LAS: 0.9117, UEM: 0.6244, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2594, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5584, loss: 0.6855, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||: 64%|######4 | 
61/95 [00:38<00:25, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9535, LAS: 0.9120, UEM: 0.6219, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3242, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.6825, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||: 67%|######7 | 64/95 [00:41<00:22, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9537, LAS: 0.9123, UEM: 0.6160, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5349, partial_loss/deprel_loss: 0.5850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7820, loss: 0.6816, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||: 72%|#######1 | 68/95 [00:43<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9541, LAS: 0.9126, UEM: 0.6144, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5792, loss: 0.6797, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||: 76%|#######5 | 72/95 [00:45<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9540, LAS: 0.9126, UEM: 0.6114, LEM: 0.3713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 0.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7874, loss: 0.6779, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||: 80%|######## | 76/95 [00:48<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9537, LAS: 0.9124, UEM: 0.6128, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8648, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8876, loss: 0.6790, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||: 84%|########4 | 80/95 [00:51<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9539, LAS: 0.9127, UEM: 0.6176, LEM: 0.3807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.3326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.6768, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||: 88%|########8 | 84/95 [00:54<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9539, LAS: 0.9127, UEM: 0.6162, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7537, partial_loss/deprel_loss: 0.6348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8654, loss: 0.6763, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||: 92%|#########1| 87/95 [00:56<00:05, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9547, LAS: 0.9135, UEM: 0.6343, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0920, partial_loss/deprel_loss: 0.2665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4384, loss: 0.6691, batch_reg_loss: 0.2068, reg_loss: 0.2071 ||: 95%|#########4| 90/95 [00:58<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9546, LAS: 0.9134, UEM: 0.6399, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0046, partial_loss/deprel_loss: 0.6334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9145, 
loss: 0.6691, batch_reg_loss: 0.2068, reg_loss: 0.2070 ||: 98%|#########7| 93/95 [01:01<00:01, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9545, LAS: 0.9133, UEM: 0.6376, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 0.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8696, loss: 0.6706, batch_reg_loss: 0.2068, reg_loss: 0.2070 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - reg_loss | 0.207 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - UEM | 0.638 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - LEM | 0.404 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EM | 0.892 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.776 | N/A\n", + "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.635 | N/A\n", + "2023-04-07 00:57:00,551 - 
INFO - combo.training.tensorboard_writer - loss | 0.671 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - LAS | 0.913 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:00,556 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:57:05,958 - INFO - combo.training.trainer - Epoch duration: 0:01:11.329365\n", + "2023-04-07 00:57:05,958 - INFO - combo.training.trainer - Estimated training time remaining: 5:23:49\n", + "2023-04-07 00:57:05,958 - INFO - allennlp.training.trainer - Epoch 113/399\n", + "2023-04-07 00:57:05,959 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:57:05,959 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:57:05,969 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9584, LAS: 0.9173, UEM: 0.6802, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1106, partial_loss/deprel_loss: 0.2887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4599, loss: 0.6359, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||: 
4%|4 | 4/95 [00:02<01:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9530, LAS: 0.9123, UEM: 0.5739, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7199, partial_loss/deprel_loss: 0.5625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.6692, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||: 7%|7 | 7/95 [00:05<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9498, LAS: 0.9099, UEM: 0.5849, LEM: 0.3816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8978, partial_loss/deprel_loss: 0.6391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.6865, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||: 11%|# | 10/95 [00:07<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9471, LAS: 0.9058, UEM: 0.5426, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2796, partial_loss/deprel_loss: 0.7912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0956, loss: 0.7191, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||: 15%|#4 | 14/95 [00:09<00:56, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9484, LAS: 0.9070, UEM: 0.5279, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4803, partial_loss/deprel_loss: 0.4972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7005, loss: 0.7120, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||: 19%|#8 | 18/95 [00:12<00:52, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9518, LAS: 0.9112, UEM: 0.5883, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1955, partial_loss/deprel_loss: 0.3472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5235, loss: 0.6831, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||: 22%|##2 | 21/95 [00:14<00:52, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9522, LAS: 0.9115, UEM: 0.5883, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.5374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7270, loss: 0.6812, batch_reg_loss: 0.2067, reg_loss: 0.2067 ||: 27%|##7 | 26/95 [00:17<00:44, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9523, LAS: 0.9114, UEM: 0.5781, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5488, loss: 0.6800, batch_reg_loss: 0.2067, reg_loss: 0.2067 ||: 33%|###2 | 31/95 [00:19<00:37, 1.72it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9533, LAS: 0.9122, UEM: 0.5999, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7041, partial_loss/deprel_loss: 0.6440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8626, loss: 0.6761, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||: 38%|###7 | 36/95 [00:21<00:32, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9536, LAS: 0.9129, UEM: 0.5938, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.4526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6463, loss: 0.6712, batch_reg_loss: 0.2066, 
reg_loss: 0.2067 ||: 43%|####3 | 41/95 [00:23<00:27, 1.97it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9542, LAS: 0.9137, UEM: 0.6311, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4491, partial_loss/deprel_loss: 0.5503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7366, loss: 0.6646, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||: 48%|####8 | 46/95 [00:27<00:28, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9545, LAS: 0.9140, UEM: 0.6245, LEM: 0.3965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3037, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.6616, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||: 53%|#####2 | 50/95 [00:30<00:28, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9544, LAS: 0.9136, UEM: 0.6169, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7795, partial_loss/deprel_loss: 0.6187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8574, loss: 0.6660, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||: 57%|#####6 | 54/95 [00:32<00:25, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9546, LAS: 0.9136, UEM: 0.6236, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0144, partial_loss/deprel_loss: 0.7123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9792, loss: 0.6655, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||: 61%|######1 | 58/95 [00:35<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9545, LAS: 0.9136, UEM: 0.6254, LEM: 0.3891, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6560, loss: 0.6656, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||: 65%|######5 | 62/95 [00:38<00:20, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9541, LAS: 0.9131, UEM: 0.6179, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7141, partial_loss/deprel_loss: 0.6444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8648, loss: 0.6699, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||: 69%|######9 | 66/95 [00:41<00:19, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9549, LAS: 0.9139, UEM: 0.6262, LEM: 0.3857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3050, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5887, loss: 0.6640, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||: 74%|#######3 | 70/95 [00:44<00:17, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9549, LAS: 0.9140, UEM: 0.6246, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3999, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6877, loss: 0.6638, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||: 77%|#######6 | 73/95 [00:46<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9554, LAS: 0.9145, UEM: 0.6319, LEM: 0.3919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.6601, batch_reg_loss: 0.2064, reg_loss: 
0.2066 ||: 80%|######## | 76/95 [00:48<00:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9548, LAS: 0.9138, UEM: 0.6278, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2888, partial_loss/deprel_loss: 0.4178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5984, loss: 0.6661, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 83%|########3 | 79/95 [00:51<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9551, LAS: 0.9141, UEM: 0.6284, LEM: 0.3882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1992, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4741, loss: 0.6631, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 87%|########7 | 83/95 [00:53<00:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9553, LAS: 0.9143, UEM: 0.6391, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.6611, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 91%|######### | 86/95 [00:56<00:06, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9544, LAS: 0.9134, UEM: 0.6323, LEM: 0.3953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4970, partial_loss/deprel_loss: 0.5067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7111, loss: 0.6680, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 94%|#########3| 89/95 [00:58<00:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9545, LAS: 0.9134, UEM: 0.6324, LEM: 
0.3946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7042, partial_loss/deprel_loss: 0.6272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.6676, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 98%|#########7| 93/95 [01:00<00:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9549, LAS: 0.9138, UEM: 0.6379, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2131, partial_loss/deprel_loss: 0.3441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.6649, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - reg_loss | 0.207 | N/A\n", + "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UEM | 0.638 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LEM | 0.399 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - EM | 0.939 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.213 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.344 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - loss | 0.665 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LAS | 0.914 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:10,929 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:10,932 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:58:15,015 - INFO - combo.training.trainer - Epoch duration: 0:01:09.056259\n", + "2023-04-07 00:58:15,015 - INFO - combo.training.trainer - Estimated training time remaining: 5:22:44\n", + "2023-04-07 00:58:15,015 - INFO - allennlp.training.trainer - Epoch 114/399\n", + "2023-04-07 00:58:15,015 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:58:15,016 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:58:15,025 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9314, LAS: 0.8917, UEM: 0.7087, LEM: 0.5256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1108, partial_loss/deprel_loss: 0.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4566, loss: 0.7819, batch_reg_loss: 0.2064, reg_loss: 0.2064 ||: 3%|3 | 3/95 [00:04<02:07, 1.39s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9427, LAS: 0.9017, UEM: 0.5768, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5833, partial_loss/deprel_loss: 0.5521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7647, loss: 0.7315, batch_reg_loss: 0.2063, reg_loss: 0.2064 ||: 7%|7 | 7/95 [00:06<01:41, 1.15s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9447, LAS: 0.9032, UEM: 0.5226, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4223, partial_loss/deprel_loss: 0.4529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6531, loss: 0.7285, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 12%|#1 | 11/95 
[00:08<01:22, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9483, LAS: 0.9059, UEM: 0.5293, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4901, partial_loss/deprel_loss: 0.5842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7717, loss: 0.7123, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 15%|#4 | 14/95 [00:11<01:12, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9464, LAS: 0.9037, UEM: 0.5079, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7024, partial_loss/deprel_loss: 0.6527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8690, loss: 0.7267, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 19%|#8 | 18/95 [00:13<01:02, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9472, LAS: 0.9046, UEM: 0.5318, LEM: 0.2996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.5741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.7191, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 22%|##2 | 21/95 [00:16<01:01, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9480, LAS: 0.9057, UEM: 0.5322, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.5636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7929, loss: 0.7136, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 25%|##5 | 24/95 [00:18<00:57, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9465, LAS: 0.9042, UEM: 0.5057, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8269, partial_loss/deprel_loss: 0.5861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8406, loss: 0.7281, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 28%|##8 | 27/95 [00:20<00:52, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9471, LAS: 0.9053, UEM: 0.5396, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6627, partial_loss/deprel_loss: 0.5766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.7164, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 33%|###2 | 31/95 [00:23<00:47, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9465, LAS: 0.9044, UEM: 0.5289, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6939, loss: 0.7222, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||: 36%|###5 | 34/95 [00:25<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9481, LAS: 0.9060, UEM: 0.5428, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 0.3679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.7106, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||: 40%|#### | 38/95 [00:27<00:39, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9504, LAS: 0.9085, UEM: 0.5692, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6906, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||: 45%|####5 | 43/95 [00:29<00:31, 1.64it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9508, LAS: 0.9088, UEM: 0.5726, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8930, partial_loss/deprel_loss: 0.5813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8498, loss: 0.6889, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||: 49%|####9 | 47/95 [00:31<00:27, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9514, LAS: 0.9093, UEM: 0.5837, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1193, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.6875, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||: 55%|#####4 | 52/95 [00:33<00:23, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9684, UAS: 0.9524, LAS: 0.9107, UEM: 0.6082, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3095, loss: 0.6773, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||: 60%|###### | 57/95 [00:36<00:20, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9536, LAS: 0.9120, UEM: 0.6220, LEM: 0.3946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3440, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5596, loss: 0.6674, batch_reg_loss: 0.2061, reg_loss: 0.2063 ||: 64%|######4 | 61/95 [00:39<00:20, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9546, LAS: 0.9131, UEM: 0.6359, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2063, partial_loss/deprel_loss: 0.3269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5089, loss: 0.6604, batch_reg_loss: 0.2061, reg_loss: 0.2063 ||: 68%|######8 | 65/95 [00:42<00:19, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9554, LAS: 0.9141, UEM: 0.6416, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.6536, batch_reg_loss: 0.2061, reg_loss: 0.2062 ||: 73%|#######2 | 69/95 [00:45<00:17, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8658, UAS: 0.9554, LAS: 0.9140, UEM: 0.6468, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1753, partial_loss/deprel_loss: 0.7502, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0412, loss: 0.6552, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||: 77%|#######6 | 73/95 [00:48<00:14, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9550, LAS: 0.9135, UEM: 0.6371, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4383, partial_loss/deprel_loss: 0.5298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7175, loss: 0.6596, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||: 81%|########1 | 77/95 [00:50<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9551, LAS: 0.9139, UEM: 0.6423, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.5931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8761, loss: 0.6583, batch_reg_loss: 0.2060, reg_loss: 0.2062 
||: 85%|########5 | 81/95 [00:53<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9553, LAS: 0.9140, UEM: 0.6380, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.3879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.6582, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||: 88%|########8 | 84/95 [00:55<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9553, LAS: 0.9139, UEM: 0.6417, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1078, partial_loss/deprel_loss: 0.8183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0821, loss: 0.6598, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||: 93%|#########2| 88/95 [00:58<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8461, UAS: 0.9549, LAS: 0.9136, UEM: 0.6432, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2994, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1180, loss: 0.6617, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||: 96%|#########5| 91/95 [01:00<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9545, LAS: 0.9133, UEM: 0.6382, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9167, partial_loss/deprel_loss: 0.6057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8738, loss: 0.6647, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||: 99%|#########8| 94/95 [01:02<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9546, LAS: 0.9133, UEM: 0.6378, LEM: 0.4006, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2826, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.6641, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 00:59:21,552 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - reg_loss | 0.206 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UEM | 0.638 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - LEM | 0.401 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EM | 0.918 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.283 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.430 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - loss | 0.664 | N/A\n", + "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - LAS | 0.913 | N/A\n", + 
"2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:59:21,559 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 00:59:26,252 - INFO - combo.training.trainer - Epoch duration: 0:01:11.236866\n", + "2023-04-07 00:59:26,253 - INFO - combo.training.trainer - Estimated training time remaining: 5:21:45\n", + "2023-04-07 00:59:26,253 - INFO - allennlp.training.trainer - Epoch 115/399\n", + "2023-04-07 00:59:26,253 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 00:59:26,254 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:59:26,263 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9542, LAS: 0.9129, UEM: 0.6562, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7398, partial_loss/deprel_loss: 0.5365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.6562, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||: 4%|4 | 4/95 [00:02<00:57, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9585, LAS: 0.9187, UEM: 0.7247, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4409, partial_loss/deprel_loss: 0.4558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6587, loss: 0.6120, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||: 7%|7 | 7/95 [00:04<00:58, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9611, LAS: 0.9198, UEM: 0.7109, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4914, partial_loss/deprel_loss: 0.5132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7147, loss: 0.6167, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||: 12%|#1 | 11/95 [00:07<00:56, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9596, LAS: 0.9177, UEM: 0.6701, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4028, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6679, loss: 0.6390, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||: 16%|#5 | 15/95 [00:09<00:51, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9672, UAS: 0.9599, LAS: 0.9190, UEM: 0.7118, LEM: 0.5007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3179, loss: 0.6322, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||: 20%|## | 19/95 [00:12<00:50, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9585, LAS: 0.9178, UEM: 0.6914, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7070, partial_loss/deprel_loss: 0.5902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8194, loss: 0.6418, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||: 
23%|##3 | 22/95 [00:14<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9599, LAS: 0.9193, UEM: 0.6954, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2777, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.6282, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||: 27%|##7 | 26/95 [00:17<00:46, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9602, LAS: 0.9198, UEM: 0.6900, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6183, loss: 0.6251, batch_reg_loss: 0.2058, reg_loss: 0.2058 ||: 31%|### | 29/95 [00:19<00:45, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9577, LAS: 0.9172, UEM: 0.6820, LEM: 0.4575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9818, partial_loss/deprel_loss: 0.7060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9669, loss: 0.6465, batch_reg_loss: 0.2058, reg_loss: 0.2058 ||: 34%|###3 | 32/95 [00:21<00:44, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9580, LAS: 0.9176, UEM: 0.6762, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5369, loss: 0.6457, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 38%|###7 | 36/95 [00:24<00:40, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9559, LAS: 0.9156, UEM: 0.6609, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9257, partial_loss/deprel_loss: 0.6299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8948, loss: 0.6591, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 42%|####2 | 40/95 [00:26<00:36, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9558, LAS: 0.9156, UEM: 0.6678, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 0.3306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5086, loss: 0.6576, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 46%|####6 | 44/95 [00:29<00:34, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9563, LAS: 0.9161, UEM: 0.6686, LEM: 0.4403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1220, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4538, loss: 0.6523, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 51%|##### | 48/95 [00:32<00:30, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9555, LAS: 0.9151, UEM: 0.6544, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4670, partial_loss/deprel_loss: 0.4503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6593, loss: 0.6589, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 55%|#####4 | 52/95 [00:34<00:27, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9562, LAS: 0.9156, UEM: 0.6531, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4095, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.6558, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||: 59%|#####8 | 56/95 [00:37<00:25, 
1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9563, LAS: 0.9158, UEM: 0.6507, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.4165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6027, loss: 0.6561, batch_reg_loss: 0.2056, reg_loss: 0.2058 ||: 64%|######4 | 61/95 [00:39<00:20, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9571, LAS: 0.9167, UEM: 0.6601, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2201, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.6494, batch_reg_loss: 0.2056, reg_loss: 0.2058 ||: 68%|######8 | 65/95 [00:42<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9568, LAS: 0.9164, UEM: 0.6540, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.3866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.6510, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||: 73%|#######2 | 69/95 [00:44<00:15, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8654, UAS: 0.9562, LAS: 0.9157, UEM: 0.6508, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0837, partial_loss/deprel_loss: 0.7093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9897, loss: 0.6556, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||: 77%|#######6 | 73/95 [00:47<00:13, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9558, LAS: 0.9151, UEM: 0.6487, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3352, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.6592, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||: 81%|########1 | 77/95 [00:49<00:11, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9558, LAS: 0.9152, UEM: 0.6437, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6079, loss: 0.6580, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 85%|########5 | 81/95 [00:52<00:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9558, LAS: 0.9151, UEM: 0.6405, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5322, partial_loss/deprel_loss: 0.6085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7987, loss: 0.6593, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 91%|######### | 86/95 [00:54<00:05, 1.69it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9556, LAS: 0.9149, UEM: 0.6366, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4661, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6402, loss: 0.6593, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 96%|#########5| 91/95 [00:57<00:02, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9553, LAS: 0.9146, UEM: 0.6385, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1003, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4344, loss: 0.6610, 
batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 100%|##########| 95/95 [00:59<00:00, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9553, LAS: 0.9146, UEM: 0.6385, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1003, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4344, loss: 0.6610, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 100%|##########| 95/95 [00:59<00:00, 1.60it/s]\n", + "2023-04-07 01:00:28,704 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9416, LAS: 0.8932, UEM: 0.5811, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 10.4837, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4616, loss: 16.5237, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.04s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9379, LAS: 0.8831, UEM: 0.4572, LEM: 0.2129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0242, partial_loss/deprel_loss: 22.0818, partial_loss/cycle_loss: 0.0000, batch_loss: 17.8702, loss: 16.6606, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9457, LAS: 0.8922, UEM: 0.5791, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8919, partial_loss/deprel_loss: 15.8157, partial_loss/cycle_loss: 0.0000, batch_loss: 12.8309, loss: 14.5765, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.05s/it]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9497, LAS: 0.8965, UEM: 0.6140, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4204, partial_loss/deprel_loss: 8.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6532, loss: 12.6692, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:01, 1.01s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9518, LAS: 0.9007, UEM: 0.6806, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 5.7408, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6375, loss: 11.9390, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.00it/s]\n", + "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - reg_loss | 0.206 | 0.000\n", + "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UEM | 0.639 | 0.681\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LEM | 0.405 | 0.414\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - EM | 0.944 | 0.943\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.100 | 0.224\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + 
"2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | 0.952\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.261 | 5.741\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - loss | 0.661 | 11.939\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LAS | 0.915 | 0.901\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:39,667 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:00:44,474 - INFO - combo.training.trainer - Epoch duration: 0:01:18.220975\n", + "2023-04-07 01:00:44,475 - INFO - combo.training.trainer - Estimated training time remaining: 5:21:03\n", + "2023-04-07 01:00:44,479 - INFO - allennlp.training.trainer - Epoch 116/399\n", + "2023-04-07 01:00:44,479 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:00:44,480 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:00:44,488 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9680, LAS: 0.9291, UEM: 0.7401, LEM: 0.4826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2020, partial_loss/deprel_loss: 0.3181, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5003, loss: 0.5417, batch_reg_loss: 0.2055, reg_loss: 0.2055 ||: 4%|4 | 4/95 [00:02<01:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9690, LAS: 0.9295, UEM: 0.7405, LEM: 0.4711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1814, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.5407, batch_reg_loss: 0.2055, reg_loss: 0.2055 ||: 7%|7 | 7/95 [00:04<01:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9584, LAS: 0.9176, UEM: 0.6493, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5633, partial_loss/deprel_loss: 0.6336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8250, loss: 0.6347, batch_reg_loss: 0.2054, reg_loss: 0.2055 ||: 12%|#1 | 11/95 [00:07<00:56, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": 
"stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9598, LAS: 0.9192, UEM: 0.6663, LEM: 0.4137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.3179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.6159, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||: 15%|#4 | 14/95 [00:09<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9610, LAS: 0.9200, UEM: 0.6714, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2278, partial_loss/deprel_loss: 0.3535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5338, loss: 0.6081, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||: 18%|#7 | 17/95 [00:11<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9594, LAS: 0.9186, UEM: 0.6447, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6805, partial_loss/deprel_loss: 0.5717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.6208, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||: 22%|##2 | 21/95 [00:14<00:49, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9585, LAS: 0.9173, UEM: 0.6355, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2706, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.6278, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||: 26%|##6 | 25/95 [00:16<00:45, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9571, LAS: 0.9159, UEM: 0.6217, LEM: 0.3660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5883, loss: 0.6413, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 29%|##9 | 28/95 [00:18<00:44, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9567, LAS: 0.9158, UEM: 0.6375, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0705, partial_loss/deprel_loss: 0.1764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3605, loss: 0.6432, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 33%|###2 | 31/95 [00:20<00:42, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9577, LAS: 0.9171, UEM: 0.6455, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2440, partial_loss/deprel_loss: 0.3688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.6353, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 37%|###6 | 35/95 [00:23<00:39, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9562, LAS: 0.9158, UEM: 0.6265, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8137, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8969, loss: 0.6497, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 41%|####1 | 39/95 [00:25<00:36, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9554, LAS: 0.9149, UEM: 0.6176, LEM: 0.3781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9319, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.6571, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 44%|####4 | 42/95 [00:28<00:36, 1.46it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9563, LAS: 0.9159, UEM: 0.6318, LEM: 0.3923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1224, partial_loss/deprel_loss: 0.2459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4264, loss: 0.6486, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 47%|####7 | 45/95 [00:30<00:36, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9558, LAS: 0.9152, UEM: 0.6242, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5414, loss: 0.6522, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||: 52%|#####1 | 49/95 [00:32<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9558, LAS: 0.9153, UEM: 0.6202, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3851, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6734, loss: 0.6525, batch_reg_loss: 0.2052, reg_loss: 0.2054 ||: 56%|#####5 | 53/95 [00:35<00:27, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9565, LAS: 0.9161, UEM: 0.6234, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4648, partial_loss/deprel_loss: 0.4853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6864, loss: 0.6478, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 60%|###### | 57/95 [00:38<00:25, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9563, LAS: 0.9161, UEM: 0.6263, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3565, partial_loss/deprel_loss: 0.4152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6086, loss: 0.6477, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 63%|######3 | 60/95 [00:40<00:23, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9564, LAS: 0.9160, UEM: 0.6273, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4026, partial_loss/deprel_loss: 0.4820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6713, loss: 0.6483, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 66%|######6 | 63/95 [00:42<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9559, LAS: 0.9156, UEM: 0.6322, LEM: 0.3938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1012, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4372, loss: 0.6501, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 69%|######9 | 66/95 [00:44<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9554, LAS: 0.9151, UEM: 0.6282, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5122, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.6536, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 73%|#######2 | 69/95 [00:46<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9712, UAS: 0.9564, LAS: 0.9164, UEM: 0.6498, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0443, partial_loss/deprel_loss: 0.1197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3098, loss: 0.6467, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||: 76%|#######5 | 72/95 [00:48<00:16, 1.38it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9566, LAS: 0.9165, UEM: 0.6545, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1457, partial_loss/deprel_loss: 0.3205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4907, loss: 0.6454, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||: 79%|#######8 | 75/95 [00:51<00:14, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9563, LAS: 0.9163, UEM: 0.6471, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2892, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6051, loss: 0.6474, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||: 84%|########4 | 80/95 [00:53<00:09, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9565, LAS: 0.9167, UEM: 0.6459, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.6453, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||: 89%|########9 | 85/95 [00:55<00:05, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9556, LAS: 0.9156, UEM: 0.6391, LEM: 0.4031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5147, partial_loss/deprel_loss: 0.8003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1483, loss: 0.6527, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||: 96%|#########5| 91/95 [00:58<00:02, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9550, LAS: 0.9149, UEM: 0.6400, LEM: 0.4062, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1389, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.6561, batch_reg_loss: 0.2050, reg_loss: 0.2053 ||: 100%|##########| 95/95 [01:01<00:00, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9550, LAS: 0.9149, UEM: 0.6400, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1389, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.6561, batch_reg_loss: 0.2050, reg_loss: 0.2053 ||: 100%|##########| 95/95 [01:01<00:00, 1.56it/s]\n", + "2023-04-07 01:01:48,450 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - reg_loss | 0.205 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - UEM | 0.640 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - LEM | 0.406 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EM | 0.938 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.139 | N/A\n", + "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.261 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - loss | 0.656 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - LAS | 0.915 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:48,459 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:01:53,134 - INFO - combo.training.trainer - Epoch duration: 0:01:08.655513\n", + "2023-04-07 01:01:53,135 - INFO - combo.training.trainer - Estimated training time remaining: 5:19:57\n", + "2023-04-07 01:01:53,135 - INFO - allennlp.training.trainer - Epoch 117/399\n", + "2023-04-07 01:01:53,135 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:01:53,136 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:01:53,144 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9657, LAS: 0.9271, UEM: 0.7289, LEM: 0.5060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3055, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.5641, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 3%|3 | 3/95 [00:02<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9583, LAS: 0.9174, UEM: 0.6494, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6166, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8207, loss: 0.6446, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 6%|6 | 6/95 [00:04<01:07, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9613, LAS: 0.9211, UEM: 0.6669, LEM: 0.4219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5055, loss: 0.6202, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 9%|9 | 9/95 [00:06<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9620, LAS: 0.9220, UEM: 0.7170, LEM: 0.4787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1334, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4405, loss: 0.6061, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 14%|#3 | 13/95 [00:09<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9627, LAS: 0.9226, UEM: 0.7430, LEM: 0.5152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.3888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.6003, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 17%|#6 | 16/95 [00:11<01:00, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9614, LAS: 0.9207, UEM: 0.7180, LEM: 0.4855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4569, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7523, loss: 0.6153, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 20%|## | 19/95 [00:14<00:56, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9606, LAS: 0.9204, UEM: 0.7169, LEM: 0.4907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5126, partial_loss/deprel_loss: 0.4923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.6176, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||: 23%|##3 | 22/95 [00:16<00:55, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9598, LAS: 0.9194, UEM: 0.7115, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9651, partial_loss/deprel_loss: 0.6207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8945, loss: 0.6246, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 26%|##6 | 25/95 [00:18<00:52, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9586, LAS: 0.9184, UEM: 0.6856, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4719, partial_loss/deprel_loss: 0.5116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.6347, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 31%|### | 29/95 [00:21<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9597, LAS: 0.9202, UEM: 0.7099, LEM: 0.4931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0503, partial_loss/deprel_loss: 0.1543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3384, loss: 0.6270, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 34%|###3 | 32/95 [00:23<00:46, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9611, LAS: 0.9215, UEM: 0.7257, LEM: 0.5059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0998, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4409, loss: 0.6144, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 37%|###6 | 35/95 [00:26<00:45, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9609, LAS: 0.9211, UEM: 0.7160, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.6155, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 40%|#### | 38/95 [00:28<00:42, 1.36it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9587, LAS: 0.9188, UEM: 0.6991, LEM: 0.4793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5246, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.6316, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||: 43%|####3 | 41/95 [00:30<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9591, LAS: 0.9193, UEM: 0.6970, LEM: 0.4749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2204, partial_loss/deprel_loss: 0.2553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.6274, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 46%|####6 | 44/95 [00:32<00:37, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9577, LAS: 0.9178, UEM: 0.6826, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6035, partial_loss/deprel_loss: 0.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7632, loss: 0.6391, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 49%|####9 | 47/95 [00:34<00:35, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9578, LAS: 0.9179, UEM: 0.6828, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2021, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5363, loss: 0.6393, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 53%|#####2 | 50/95 [00:36<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9569, LAS: 0.9169, UEM: 0.6781, LEM: 0.4556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2868, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6455, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 56%|#####5 | 53/95 [00:39<00:31, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9556, LAS: 0.9155, UEM: 0.6716, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0218, partial_loss/deprel_loss: 0.7471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0068, loss: 0.6539, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 60%|###### | 57/95 [00:41<00:26, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9559, LAS: 0.9157, UEM: 0.6668, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4642, partial_loss/deprel_loss: 0.4842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6850, loss: 0.6526, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 64%|######4 | 61/95 [00:43<00:22, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9561, LAS: 0.9162, UEM: 0.6638, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4905, partial_loss/deprel_loss: 0.4883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6513, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 68%|######8 | 65/95 [00:46<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9557, LAS: 0.9158, UEM: 0.6566, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7983, partial_loss/deprel_loss: 0.5908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8371, loss: 0.6525, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 73%|#######2 | 69/95 [00:48<00:16, 1.56it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9296, UAS: 0.9558, LAS: 0.9159, UEM: 0.6555, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5796, loss: 0.6534, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||: 77%|#######6 | 73/95 [00:52<00:15, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9562, LAS: 0.9163, UEM: 0.6571, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.6500, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||: 80%|######## | 76/95 [00:54<00:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9569, LAS: 0.9168, UEM: 0.6612, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2000, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5333, loss: 0.6461, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||: 83%|########3 | 79/95 [00:56<00:11, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9569, LAS: 0.9167, UEM: 0.6574, LEM: 0.4224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6471, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||: 86%|########6 | 82/95 [00:59<00:09, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9563, LAS: 0.9161, UEM: 0.6521, LEM: 0.4176, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4103, partial_loss/deprel_loss: 0.4323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.6524, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||: 89%|########9 | 85/95 [01:01<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9564, LAS: 0.9163, UEM: 0.6528, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3299, partial_loss/deprel_loss: 0.3959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.6503, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||: 94%|#########3| 89/95 [01:03<00:03, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9563, LAS: 0.9160, UEM: 0.6453, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6606, loss: 0.6513, batch_reg_loss: 0.2047, reg_loss: 0.2048 ||: 99%|#########8| 94/95 [01:05<00:00, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9564, LAS: 0.9161, UEM: 0.6459, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.6502, batch_reg_loss: 0.2047, reg_loss: 0.2048 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-07 01:03:01,644 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - reg_loss | 0.205 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UEM | 0.646 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - LEM | 0.409 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EM | 0.921 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.252 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.369 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - loss | 0.650 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - LAS | 0.916 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:03:01,652 - INFO - allennlp.training.checkpointer - Best 
validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:03:05,803 - INFO - combo.training.trainer - Epoch duration: 0:01:12.667929\n", + "2023-04-07 01:03:05,803 - INFO - combo.training.trainer - Estimated training time remaining: 5:19:01\n", + "2023-04-07 01:03:05,803 - INFO - allennlp.training.trainer - Epoch 118/399\n", + "2023-04-07 01:03:05,807 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:03:05,808 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:03:05,814 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9398, LAS: 0.8988, UEM: 0.3985, LEM: 0.2055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7798, partial_loss/deprel_loss: 0.6197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8564, loss: 0.7712, batch_reg_loss: 0.2046, reg_loss: 0.2047 ||: 4%|4 | 4/95 [00:02<00:54, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9468, LAS: 0.9063, UEM: 0.5245, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.3276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4980, loss: 0.7248, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 8%|8 | 8/95 [00:05<00:54, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9524, LAS: 0.9122, UEM: 0.5617, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4304, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6557, loss: 0.6857, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 13%|#2 | 12/95 [00:07<00:53, 1.54it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9504, LAS: 0.9102, UEM: 0.5473, LEM: 0.3003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3414, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.6945, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 16%|#5 | 15/95 [00:10<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9525, LAS: 0.9133, UEM: 0.5967, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6889, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8063, loss: 0.6762, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 20%|## | 19/95 [00:12<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9561, LAS: 0.9172, UEM: 0.6425, LEM: 0.4060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1962, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6493, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 24%|##4 | 23/95 [00:15<00:48, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9572, LAS: 0.9185, UEM: 0.6440, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5588, loss: 0.6393, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||: 28%|##8 | 27/95 [00:17<00:43, 1.56it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9580, LAS: 0.9192, UEM: 0.6569, LEM: 0.4174, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.2687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4512, loss: 0.6296, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||: 33%|###2 | 31/95 [00:20<00:41, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9586, LAS: 0.9196, UEM: 0.6521, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5693, loss: 0.6243, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||: 37%|###6 | 35/95 [00:23<00:39, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9578, LAS: 0.9188, UEM: 0.6441, LEM: 0.4000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6328, loss: 0.6311, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||: 40%|#### | 38/95 [00:25<00:37, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9587, LAS: 0.9196, UEM: 0.6489, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.6265, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||: 43%|####3 | 41/95 [00:27<00:36, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9579, LAS: 0.9185, UEM: 0.6353, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4702, partial_loss/deprel_loss: 0.5163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.6337, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||: 46%|####6 | 44/95 
[00:29<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9577, LAS: 0.9182, UEM: 0.6388, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5220, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6353, batch_reg_loss: 0.2044, reg_loss: 0.2046 ||: 49%|####9 | 47/95 [00:31<00:33, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9570, LAS: 0.9176, UEM: 0.6303, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5341, loss: 0.6409, batch_reg_loss: 0.2044, reg_loss: 0.2046 ||: 53%|#####2 | 50/95 [00:33<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9577, LAS: 0.9183, UEM: 0.6410, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1441, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4514, loss: 0.6355, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||: 56%|#####5 | 53/95 [00:35<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9579, LAS: 0.9183, UEM: 0.6397, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6037, loss: 0.6348, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||: 59%|#####8 | 56/95 [00:38<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9582, LAS: 0.9185, UEM: 0.6424, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.4151, partial_loss/deprel_loss: 0.4470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.6306, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||: 62%|######2 | 59/95 [00:40<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9582, LAS: 0.9184, UEM: 0.6424, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5443, partial_loss/deprel_loss: 0.5232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7318, loss: 0.6310, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||: 65%|######5 | 62/95 [00:42<00:23, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9578, LAS: 0.9181, UEM: 0.6436, LEM: 0.4004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.6327, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||: 68%|######8 | 65/95 [00:44<00:22, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9586, LAS: 0.9189, UEM: 0.6586, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5060, loss: 0.6260, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 72%|#######1 | 68/95 [00:47<00:20, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9582, LAS: 0.9185, UEM: 0.6553, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7309, partial_loss/deprel_loss: 0.5876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8206, loss: 0.6301, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 75%|#######4 | 71/95 [00:49<00:18, 
1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9575, LAS: 0.9177, UEM: 0.6469, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4428, partial_loss/deprel_loss: 0.4354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6412, loss: 0.6368, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 78%|#######7 | 74/95 [00:51<00:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9564, LAS: 0.9164, UEM: 0.6414, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5772, loss: 0.6446, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 81%|########1 | 77/95 [00:54<00:13, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9566, LAS: 0.9169, UEM: 0.6540, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7177, partial_loss/deprel_loss: 0.5827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8140, loss: 0.6425, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 84%|########4 | 80/95 [00:56<00:11, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9564, LAS: 0.9167, UEM: 0.6479, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1983, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5313, loss: 0.6447, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 88%|########8 | 84/95 [00:58<00:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9568, LAS: 0.9170, UEM: 0.6508, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.4443, partial_loss/deprel_loss: 0.4700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6691, loss: 0.6432, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 92%|#########1| 87/95 [01:01<00:05, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9559, LAS: 0.9159, UEM: 0.6427, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7055, partial_loss/deprel_loss: 0.6593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8728, loss: 0.6516, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||: 96%|#########5| 91/95 [01:03<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9562, LAS: 0.9163, UEM: 0.6432, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.4098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6499, batch_reg_loss: 0.2043, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:05<00:00, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9562, LAS: 0.9163, UEM: 0.6432, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.4098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6499, batch_reg_loss: 0.2043, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - reg_loss | 0.204 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - UEM | 0.643 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - LEM | 0.409 | N/A\n", + "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.310 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.410 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - loss | 0.650 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - LAS | 0.916 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:14,736 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:04:19,866 - INFO - combo.training.trainer - Epoch duration: 0:01:14.062399\n", + "2023-04-07 01:04:19,866 - INFO - combo.training.trainer - Estimated training time remaining: 5:18:08\n", + "2023-04-07 01:04:19,867 - INFO - allennlp.training.trainer - Epoch 119/399\n", + "2023-04-07 01:04:19,867 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:04:19,868 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:04:19,877 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9680, LAS: 0.9297, UEM: 0.7144, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.3151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5497, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||: 5%|5 | 5/95 [00:02<00:37, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9658, LAS: 0.9279, UEM: 0.7102, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.5502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7768, loss: 0.5636, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||: 11%|# | 10/95 [00:04<00:37, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9595, LAS: 0.9203, UEM: 0.6506, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5168, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.6185, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||: 15%|#4 | 14/95 
[00:07<00:40, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9612, LAS: 0.9225, UEM: 0.6805, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1406, partial_loss/deprel_loss: 0.2792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.6006, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||: 18%|#7 | 17/95 [00:09<00:47, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9611, LAS: 0.9216, UEM: 0.6632, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.5895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8029, loss: 0.6072, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||: 22%|##2 | 21/95 [00:12<00:46, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9596, LAS: 0.9201, UEM: 0.6629, LEM: 0.4254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.5451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.6138, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 25%|##5 | 24/95 [00:14<00:45, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9589, LAS: 0.9196, UEM: 0.6462, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2599, partial_loss/deprel_loss: 0.3826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5622, loss: 0.6170, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 29%|##9 | 28/95 [00:17<00:44, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9607, LAS: 0.9210, UEM: 0.6755, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5445, loss: 0.6047, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 33%|###2 | 31/95 [00:19<00:45, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9595, LAS: 0.9196, UEM: 0.6593, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2287, partial_loss/deprel_loss: 0.3646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5415, loss: 0.6169, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 37%|###6 | 35/95 [00:22<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9577, LAS: 0.9178, UEM: 0.6494, LEM: 0.4099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5927, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7327, loss: 0.6291, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 40%|#### | 38/95 [00:24<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.9555, LAS: 0.9152, UEM: 0.6316, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4118, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0912, loss: 0.6490, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||: 44%|####4 | 42/95 [00:26<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9555, LAS: 0.9152, UEM: 0.6242, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4271, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.6491, batch_reg_loss: 0.2040, reg_loss: 
0.2041 ||: 48%|####8 | 46/95 [00:29<00:31, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9555, LAS: 0.9153, UEM: 0.6226, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4376, loss: 0.6464, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 53%|#####2 | 50/95 [00:31<00:28, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9567, LAS: 0.9167, UEM: 0.6471, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1921, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4806, loss: 0.6348, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 57%|#####6 | 54/95 [00:35<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9551, LAS: 0.9151, UEM: 0.6367, LEM: 0.4053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3423, partial_loss/deprel_loss: 0.7008, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0331, loss: 0.6454, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 60%|###### | 57/95 [00:37<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9559, LAS: 0.9158, UEM: 0.6492, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5286, loss: 0.6408, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 63%|######3 | 60/95 [00:39<00:24, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9561, LAS: 0.9162, UEM: 0.6626, LEM: 0.4415, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8539, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8731, loss: 0.6397, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 66%|######6 | 63/95 [00:41<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9565, LAS: 0.9165, UEM: 0.6619, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.6368, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||: 71%|####### | 67/95 [00:44<00:20, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9563, LAS: 0.9162, UEM: 0.6544, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3891, partial_loss/deprel_loss: 0.4232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.6394, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 75%|#######4 | 71/95 [00:47<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9556, LAS: 0.9155, UEM: 0.6502, LEM: 0.4245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.2808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4618, loss: 0.6453, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 79%|#######8 | 75/95 [00:49<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9363, UAS: 0.9553, LAS: 0.9152, UEM: 0.6450, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1619, partial_loss/deprel_loss: 0.3237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.6480, batch_reg_loss: 0.2039, reg_loss: 0.2041 
||: 83%|########3 | 79/95 [00:52<00:10, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9551, LAS: 0.9150, UEM: 0.6381, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.6701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8823, loss: 0.6514, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 87%|########7 | 83/95 [00:55<00:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9554, LAS: 0.9153, UEM: 0.6370, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4684, partial_loss/deprel_loss: 0.5085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7044, loss: 0.6494, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 91%|######### | 86/95 [00:57<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9557, LAS: 0.9156, UEM: 0.6374, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2779, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5975, loss: 0.6469, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 94%|#########3| 89/95 [00:59<00:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9557, LAS: 0.9154, UEM: 0.6349, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.6025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.6483, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||: 97%|#########6| 92/95 [01:01<00:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9558, LAS: 0.9156, UEM: 0.6386, LEM: 0.4066, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6477, batch_reg_loss: 0.2039, reg_loss: 0.2040 ||: 100%|##########| 95/95 [01:04<00:00, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9558, LAS: 0.9156, UEM: 0.6386, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6477, batch_reg_loss: 0.2039, reg_loss: 0.2040 ||: 100%|##########| 95/95 [01:04<00:00, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - reg_loss | 0.204 | N/A\n", + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - UEM | 0.639 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LEM | 0.407 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - EM | 0.936 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.224 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | N/A\n", + 
"2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.348 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - loss | 0.648 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LAS | 0.916 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:27,556 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:05:32,555 - INFO - combo.training.trainer - Epoch duration: 0:01:12.688653\n", + "2023-04-07 01:05:32,556 - INFO - combo.training.trainer - Estimated training time remaining: 5:17:11\n", + "2023-04-07 01:05:32,556 - INFO - allennlp.training.trainer - Epoch 120/399\n", + "2023-04-07 01:05:32,556 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:05:32,557 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:05:32,567 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9607, LAS: 0.9192, UEM: 0.6978, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8741, partial_loss/deprel_loss: 0.6850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9267, loss: 0.6465, batch_reg_loss: 0.2039, reg_loss: 0.2039 ||: 4%|4 | 4/95 [00:02<00:57, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9641, LAS: 0.9246, UEM: 0.7115, LEM: 0.4575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4423, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.5976, batch_reg_loss: 0.2038, reg_loss: 0.2039 ||: 7%|7 | 7/95 [00:04<00:58, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9647, LAS: 0.9252, UEM: 0.7035, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4366, partial_loss/deprel_loss: 0.4334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.5810, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||: 13%|#2 | 12/95 [00:06<00:49, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9593, LAS: 0.9201, UEM: 0.6765, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.6190, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||: 17%|#6 | 16/95 [00:09<00:45, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9571, LAS: 0.9183, UEM: 0.6765, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0005, partial_loss/deprel_loss: 0.6994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9634, loss: 0.6334, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||: 22%|##2 | 21/95 [00:11<00:40, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9577, LAS: 0.9187, UEM: 0.6619, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4076, partial_loss/deprel_loss: 0.5277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7075, loss: 0.6312, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||: 26%|##6 | 25/95 [00:13<00:38, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9590, LAS: 0.9198, UEM: 0.6632, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6214, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 31%|### | 29/95 [00:16<00:37, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9589, LAS: 0.9198, UEM: 0.6604, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6513, partial_loss/deprel_loss: 0.5765, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7952, loss: 0.6228, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 35%|###4 | 33/95 [00:19<00:38, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9584, LAS: 0.9192, UEM: 0.6470, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3922, partial_loss/deprel_loss: 0.4201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.6277, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 39%|###8 | 37/95 [00:21<00:35, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9585, LAS: 0.9190, UEM: 0.6380, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3262, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.6304, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 43%|####3 | 41/95 [00:24<00:35, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9584, LAS: 0.9187, UEM: 0.6337, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2109, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5713, loss: 0.6353, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 47%|####7 | 45/95 [00:26<00:32, 1.56it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9592, LAS: 0.9196, UEM: 0.6479, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0840, partial_loss/deprel_loss: 0.2389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.6285, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||: 52%|#####1 | 49/95 [00:30<00:32, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9584, LAS: 0.9189, UEM: 0.6377, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6546, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.6337, batch_reg_loss: 0.2036, reg_loss: 0.2038 ||: 56%|#####5 | 53/95 [00:32<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9571, LAS: 0.9176, UEM: 0.6324, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.3608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.6433, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9569, LAS: 0.9173, UEM: 0.6276, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6429, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8400, loss: 0.6461, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 62%|######2 | 59/95 [00:37<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9704, UAS: 0.9578, LAS: 0.9186, UEM: 0.6535, LEM: 0.4186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0350, partial_loss/deprel_loss: 0.1191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3059, loss: 0.6387, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 65%|######5 | 62/95 [00:39<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9576, LAS: 0.9183, UEM: 0.6445, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5544, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.6401, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 69%|######9 | 66/95 [00:41<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9575, LAS: 0.9182, UEM: 0.6455, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6521, partial_loss/deprel_loss: 0.6149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8259, loss: 0.6402, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 73%|#######2 | 69/95 [00:44<00:18, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9570, LAS: 0.9177, UEM: 0.6504, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1028, partial_loss/deprel_loss: 0.1930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3785, loss: 0.6430, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 76%|#######5 | 72/95 [00:46<00:16, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9560, LAS: 0.9166, UEM: 0.6452, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.3310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5121, loss: 0.6504, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 80%|######## | 76/95 [00:48<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9562, LAS: 0.9168, UEM: 0.6437, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4998, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.6489, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||: 84%|########4 | 80/95 [00:51<00:09, 
1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9564, LAS: 0.9170, UEM: 0.6455, LEM: 0.4172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3524, partial_loss/deprel_loss: 0.3942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5894, loss: 0.6464, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||: 88%|########8 | 84/95 [00:53<00:07, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9565, LAS: 0.9170, UEM: 0.6404, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.4616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6478, loss: 0.6465, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||: 93%|#########2| 88/95 [00:56<00:04, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9563, LAS: 0.9166, UEM: 0.6429, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2583, partial_loss/deprel_loss: 0.3898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5670, loss: 0.6479, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||: 97%|#########6| 92/95 [00:59<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9562, LAS: 0.9165, UEM: 0.6439, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6464, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7945, loss: 0.6475, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 01:06:36,825 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8825, UAS: 0.9550, LAS: 0.9072, UEM: 0.7556, LEM: 0.5511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1711, partial_loss/deprel_loss: 23.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0432, loss: 11.8022, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9537, LAS: 0.9059, UEM: 0.7448, LEM: 0.5037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 7.0066, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6395, loss: 11.6950, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.09it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9520, LAS: 0.9009, UEM: 0.6977, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0938, partial_loss/deprel_loss: 20.2974, partial_loss/cycle_loss: 0.0000, batch_loss: 16.4566, loss: 11.4879, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:07<00:01, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9515, LAS: 0.9014, UEM: 0.6811, LEM: 0.4059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0456, partial_loss/deprel_loss: 12.9410, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5620, loss: 11.0767, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.16it/s]\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - reg_loss | 0.204 | 0.000\n", + 
"2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - UEM | 0.644 | 0.681\n", + "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - LEM | 0.411 | 0.406\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - EM | 0.906 | 0.879\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.646 | 1.046\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | 0.952\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.577 | 12.941\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - loss | 0.648 | 11.077\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - LAS | 0.917 | 0.901\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:06:46,329 - INFO - 
combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:06:46,336 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:06:52,753 - INFO - combo.training.trainer - Epoch duration: 0:01:20.197188\n", + "2023-04-07 01:06:52,754 - INFO - combo.training.trainer - Estimated training time remaining: 5:16:31\n", + "2023-04-07 01:06:52,754 - INFO - allennlp.training.trainer - Epoch 121/399\n", + "2023-04-07 01:06:52,754 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:06:52,755 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:06:52,764 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9657, LAS: 0.9285, UEM: 0.7889, LEM: 0.6036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4974, partial_loss/deprel_loss: 0.5193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 0.5442, batch_reg_loss: 0.2035, reg_loss: 0.2035 ||: 3%|3 | 3/95 [00:02<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9615, LAS: 0.9228, UEM: 0.7172, LEM: 0.5127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4871, loss: 0.5970, batch_reg_loss: 0.2035, reg_loss: 0.2035 ||: 7%|7 | 7/95 [00:04<00:57, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9591, LAS: 0.9207, UEM: 0.6577, LEM: 0.4435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2278, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4752, loss: 0.6176, batch_reg_loss: 0.2034, reg_loss: 0.2035 ||: 13%|#2 | 12/95 [00:06<00:50, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9604, LAS: 0.9221, UEM: 0.6761, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3532, partial_loss/deprel_loss: 0.4561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6389, loss: 0.6078, batch_reg_loss: 0.2034, reg_loss: 0.2035 ||: 17%|#6 | 16/95 [00:09<00:48, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9605, LAS: 0.9217, UEM: 0.6605, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4820, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6695, loss: 0.6117, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||: 21%|##1 | 20/95 [00:11<00:45, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9606, LAS: 0.9215, UEM: 0.6706, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.3131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.6099, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||: 25%|##5 | 24/95 [00:14<00:43, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9551, LAS: 0.9160, UEM: 0.6458, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0604, partial_loss/deprel_loss: 0.6867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9648, loss: 0.6471, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||: 28%|##8 | 27/95 [00:16<00:43, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9537, LAS: 0.9144, UEM: 0.6245, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0133, partial_loss/deprel_loss: 0.7242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9854, loss: 0.6621, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||: 33%|###2 | 31/95 [00:18<00:39, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9545, LAS: 0.9156, UEM: 0.6416, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.3377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.6512, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 37%|###6 | 35/95 [00:20<00:36, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9555, LAS: 0.9166, UEM: 0.6503, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.6435, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 41%|####1 | 39/95 [00:22<00:32, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9564, LAS: 0.9176, UEM: 0.6608, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5306, partial_loss/deprel_loss: 0.5478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.6387, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 46%|####6 | 44/95 [00:25<00:27, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9563, LAS: 0.9174, UEM: 0.6605, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 
0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7088, loss: 0.6393, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 51%|##### | 48/95 [00:28<00:27, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9548, LAS: 0.9160, UEM: 0.6715, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0341, partial_loss/deprel_loss: 0.1105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2985, loss: 0.6491, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 55%|#####4 | 52/95 [00:31<00:27, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9543, LAS: 0.9154, UEM: 0.6605, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7332, partial_loss/deprel_loss: 0.5672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8036, loss: 0.6531, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9547, LAS: 0.9155, UEM: 0.6511, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6969, loss: 0.6522, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||: 63%|######3 | 60/95 [00:36<00:23, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9260, UAS: 0.9550, LAS: 0.9158, UEM: 0.6472, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.6503, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||: 66%|######6 | 63/95 [00:39<00:22, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9551, LAS: 0.9158, UEM: 0.6459, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.5283, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.6498, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||: 69%|######9 | 66/95 [00:41<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9557, LAS: 0.9162, UEM: 0.6485, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5249, loss: 0.6453, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||: 73%|#######2 | 69/95 [00:43<00:17, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9565, LAS: 0.9170, UEM: 0.6550, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2400, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5552, loss: 0.6408, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||: 76%|#######5 | 72/95 [00:45<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9564, LAS: 0.9168, UEM: 0.6488, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3583, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5980, loss: 0.6432, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||: 80%|######## | 76/95 [00:47<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9573, LAS: 0.9176, UEM: 0.6578, LEM: 0.4263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1597, partial_loss/deprel_loss: 0.3499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.6371, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||: 84%|########4 | 80/95 [00:51<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9572, LAS: 0.9176, UEM: 0.6526, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8893, partial_loss/deprel_loss: 0.6400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8930, loss: 0.6384, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 88%|########8 | 84/95 [00:53<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9575, LAS: 0.9180, UEM: 0.6517, LEM: 0.4188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2876, partial_loss/deprel_loss: 0.4038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.6361, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 93%|#########2| 88/95 [00:56<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9578, LAS: 0.9182, UEM: 0.6517, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 0.4666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6582, loss: 0.6346, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 96%|#########5| 91/95 [00:58<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9572, LAS: 0.9176, UEM: 0.6478, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3699, partial_loss/deprel_loss: 0.4647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.6397, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 99%|#########8| 94/95 
[01:00<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9570, LAS: 0.9174, UEM: 0.6454, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7064, partial_loss/deprel_loss: 0.5231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7628, loss: 0.6410, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 100%|##########| 95/95 [01:00<00:00, 1.56it/s]\n", + "2023-04-07 01:07:56,773 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - reg_loss | 0.203 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UEM | 0.645 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - LEM | 0.411 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EM | 0.904 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.706 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.523 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - loss | 0.641 | N/A\n", + "2023-04-07 
01:07:56,775 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - LAS | 0.917 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:07:56,780 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:08:01,559 - INFO - combo.training.trainer - Epoch duration: 0:01:08.804784\n", + "2023-04-07 01:08:01,559 - INFO - combo.training.trainer - Estimated training time remaining: 5:15:25\n", + "2023-04-07 01:08:01,559 - INFO - allennlp.training.trainer - Epoch 122/399\n", + "2023-04-07 01:08:01,559 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:08:01,560 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:08:01,568 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9522, LAS: 0.9092, UEM: 0.6411, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2410, partial_loss/deprel_loss: 0.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6883, batch_reg_loss: 0.2031, reg_loss: 0.2031 ||: 4%|4 | 4/95 [00:02<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9574, LAS: 0.9141, UEM: 0.6795, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6053, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7961, loss: 0.6567, batch_reg_loss: 0.2031, reg_loss: 0.2031 ||: 7%|7 | 7/95 [00:04<01:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9607, LAS: 0.9189, UEM: 0.6862, LEM: 0.4099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1805, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6337, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||: 12%|#1 | 11/95 [00:07<00:58, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9631, LAS: 0.9222, UEM: 0.7088, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2324, partial_loss/deprel_loss: 0.3625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.6084, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||: 15%|#4 | 14/95 [00:10<00:59, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9604, LAS: 0.9200, UEM: 0.6754, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8685, partial_loss/deprel_loss: 0.5884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8475, loss: 0.6257, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||: 19%|#8 | 18/95 [00:12<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9579, LAS: 0.9176, UEM: 0.6667, LEM: 0.4036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.4474, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1328, loss: 0.6446, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 22%|##2 | 21/95 [00:14<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9560, LAS: 0.9159, UEM: 0.6531, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2114, partial_loss/deprel_loss: 0.6714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.6546, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 25%|##5 | 24/95 [00:17<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9556, LAS: 0.9155, UEM: 0.6472, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1760, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.6565, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 28%|##8 | 27/95 [00:19<00:51, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9556, LAS: 0.9157, UEM: 0.6317, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7273, partial_loss/deprel_loss: 0.5864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.6584, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 33%|###2 | 31/95 [00:22<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9570, LAS: 0.9178, UEM: 0.6732, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.6434, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||: 36%|###5 | 34/95 [00:24<00:45, 1.33it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9577, LAS: 0.9184, UEM: 0.6754, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6310, partial_loss/deprel_loss: 0.5785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7920, loss: 0.6375, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 40%|#### | 38/95 [00:27<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9576, LAS: 0.9185, UEM: 0.6792, LEM: 0.4450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.4232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.6361, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 43%|####3 | 41/95 [00:29<00:39, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9574, LAS: 0.9182, UEM: 0.6802, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3893, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.6373, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 48%|####8 | 46/95 [00:31<00:32, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9577, LAS: 0.9183, UEM: 0.6801, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6569, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8026, loss: 0.6332, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 54%|#####3 | 51/95 [00:34<00:26, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9563, LAS: 0.9167, UEM: 0.6622, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, 
partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7220, loss: 0.6428, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 59%|#####8 | 56/95 [00:36<00:21, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9564, LAS: 0.9165, UEM: 0.6609, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1120, partial_loss/deprel_loss: 0.2517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4266, loss: 0.6454, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||: 63%|######3 | 60/95 [00:39<00:19, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9566, LAS: 0.9166, UEM: 0.6570, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2082, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.6445, batch_reg_loss: 0.2028, reg_loss: 0.2030 ||: 67%|######7 | 64/95 [00:41<00:17, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9565, LAS: 0.9165, UEM: 0.6534, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5188, loss: 0.6468, batch_reg_loss: 0.2028, reg_loss: 0.2030 ||: 72%|#######1 | 68/95 [00:44<00:16, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9368, UAS: 0.9571, LAS: 0.9168, UEM: 0.6561, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1879, partial_loss/deprel_loss: 0.3157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4929, loss: 0.6437, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||: 76%|#######5 | 72/95 [00:47<00:14, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9571, LAS: 0.9170, UEM: 0.6505, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4361, partial_loss/deprel_loss: 0.4849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.6436, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||: 80%|######## | 76/95 [00:49<00:12, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9567, LAS: 0.9166, UEM: 0.6428, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.6456, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||: 84%|########4 | 80/95 [00:52<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9566, LAS: 0.9165, UEM: 0.6422, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2938, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.6467, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||: 88%|########8 | 84/95 [00:54<00:07, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9566, LAS: 0.9164, UEM: 0.6409, LEM: 0.4035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7118, partial_loss/deprel_loss: 0.6359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8538, loss: 0.6471, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||: 93%|#########2| 88/95 [00:57<00:04, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9569, LAS: 0.9167, UEM: 0.6413, LEM: 0.4018, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2269, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.6463, batch_reg_loss: 0.2027, reg_loss: 0.2029 ||: 97%|#########6| 92/95 [01:00<00:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9575, LAS: 0.9173, UEM: 0.6502, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3807, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6188, loss: 0.6419, batch_reg_loss: 0.2027, reg_loss: 0.2029 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 01:09:07,080 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:09:07,080 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - reg_loss | 0.203 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UEM | 0.650 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LEM | 0.412 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EM | 0.924 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.381 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 
| N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.425 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - loss | 0.642 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LAS | 0.917 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:09:07,082 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:07,082 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:07,086 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:09:11,880 - INFO - combo.training.trainer - Epoch duration: 0:01:10.320997\n", + "2023-04-07 01:09:11,881 - INFO - combo.training.trainer - Estimated training time remaining: 5:14:22\n", + "2023-04-07 01:09:11,881 - INFO - allennlp.training.trainer - Epoch 123/399\n", + "2023-04-07 01:09:11,881 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:09:11,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:09:11,892 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9522, LAS: 0.9148, UEM: 0.3620, LEM: 0.1128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4884, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.6508, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||: 3%|3 | 3/95 [00:02<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9526, LAS: 0.9140, UEM: 0.4789, LEM: 0.2115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1629, partial_loss/deprel_loss: 0.3631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5257, loss: 0.6626, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||: 6%|6 | 6/95 [00:04<01:06, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9574, LAS: 0.9187, UEM: 0.5721, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6244, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||: 9%|9 | 9/95 [00:06<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9548, LAS: 0.9155, UEM: 0.5731, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5578, partial_loss/deprel_loss: 0.6007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7948, loss: 0.6512, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||: 13%|#2 | 12/95 [00:09<01:03, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9550, LAS: 0.9159, UEM: 0.5895, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5842, partial_loss/deprel_loss: 0.5232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7381, loss: 0.6500, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||: 16%|#5 | 15/95 [00:11<01:01, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9543, LAS: 0.9144, UEM: 0.5722, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3629, partial_loss/deprel_loss: 0.3955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5917, loss: 0.6535, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 19%|#8 | 18/95 [00:13<00:57, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9538, LAS: 0.9140, UEM: 0.5603, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3997, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.6544, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 23%|##3 | 22/95 [00:15<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9542, LAS: 0.9148, UEM: 0.5804, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6433, partial_loss/deprel_loss: 0.4986, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7302, loss: 0.6507, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 27%|##7 | 26/95 [00:18<00:46, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9548, LAS: 0.9153, UEM: 0.5932, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.5432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7341, loss: 0.6479, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 31%|### | 29/95 [00:20<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9553, LAS: 0.9154, UEM: 0.5956, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5195, loss: 0.6472, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 34%|###3 | 32/95 [00:22<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9560, LAS: 0.9162, UEM: 0.6137, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.6398, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||: 37%|###6 | 35/95 [00:25<00:43, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9567, LAS: 0.9168, UEM: 0.6190, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4259, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.6367, batch_reg_loss: 0.2026, reg_loss: 0.2026 ||: 40%|#### | 38/95 [00:27<00:41, 1.37it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9576, LAS: 0.9179, UEM: 0.6319, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1669, partial_loss/deprel_loss: 0.2997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4757, loss: 0.6291, batch_reg_loss: 0.2026, reg_loss: 0.2026 ||: 43%|####3 | 41/95 [00:29<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9573, LAS: 0.9176, UEM: 0.6268, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.5440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7702, loss: 0.6318, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 46%|####6 | 44/95 [00:31<00:37, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9581, LAS: 0.9185, UEM: 0.6446, LEM: 0.3997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1093, partial_loss/deprel_loss: 0.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4269, loss: 0.6259, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 49%|####9 | 47/95 [00:33<00:35, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9578, LAS: 0.9183, UEM: 0.6351, LEM: 0.3895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.3295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5234, loss: 0.6274, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 54%|#####3 | 51/95 [00:36<00:31, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9567, LAS: 0.9169, UEM: 0.6282, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.3334, partial_loss/deprel_loss: 0.8025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1112, loss: 0.6377, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 57%|#####6 | 54/95 [00:38<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9557, LAS: 0.9158, UEM: 0.6224, LEM: 0.3775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5367, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7300, loss: 0.6446, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 60%|###### | 57/95 [00:40<00:26, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9569, LAS: 0.9172, UEM: 0.6417, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5832, loss: 0.6343, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||: 65%|######5 | 62/95 [00:43<00:20, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9569, LAS: 0.9174, UEM: 0.6374, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6705, partial_loss/deprel_loss: 0.6447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8523, loss: 0.6355, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||: 71%|####### | 67/95 [00:45<00:16, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9559, LAS: 0.9163, UEM: 0.6302, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2689, partial_loss/deprel_loss: 0.8164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1094, loss: 0.6433, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||: 76%|#######5 | 72/95 [00:47<00:12, 1.88it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9556, LAS: 0.9158, UEM: 0.6252, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2892, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5660, loss: 0.6471, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||: 80%|######## | 76/95 [00:49<00:10, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9563, LAS: 0.9166, UEM: 0.6355, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3708, partial_loss/deprel_loss: 0.4307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6211, loss: 0.6427, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||: 84%|########4 | 80/95 [00:52<00:09, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9561, LAS: 0.9164, UEM: 0.6302, LEM: 0.3872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4902, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7091, loss: 0.6444, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 88%|########8 | 84/95 [00:55<00:07, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9566, LAS: 0.9172, UEM: 0.6456, LEM: 0.4111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2067, partial_loss/deprel_loss: 0.2926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4778, loss: 0.6389, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 93%|#########2| 88/95 [00:59<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9566, LAS: 0.9171, UEM: 0.6438, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2377, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5189, loss: 0.6395, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 96%|#########5| 91/95 [01:01<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9569, LAS: 0.9175, UEM: 0.6463, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.4120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6364, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 99%|#########8| 94/95 [01:03<00:00, 1.37it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9571, LAS: 0.9176, UEM: 0.6469, LEM: 0.4097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2050, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.6357, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - reg_loss | 0.203 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - UEM | 0.647 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - LEM | 0.410 | N/A\n", + "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EM | 0.933 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.205 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.404 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - loss | 0.636 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - LAS | 0.918 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:10:19,435 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:10:19,435 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:10:19,440 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:10:24,289 - INFO - combo.training.trainer - Epoch duration: 0:01:12.408076\n", + "2023-04-07 01:10:24,290 - INFO - combo.training.trainer - Estimated training time remaining: 5:13:23\n", + "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - Epoch 124/399\n", + "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:10:24,298 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9765, LAS: 0.9418, UEM: 0.7820, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1438, partial_loss/deprel_loss: 0.3288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.4928, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||: 3%|3 | 3/95 [00:02<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9661, LAS: 0.9291, UEM: 0.7183, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4962, partial_loss/deprel_loss: 0.4507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.5646, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||: 6%|6 | 6/95 [00:04<01:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9637, LAS: 0.9263, UEM: 0.6649, LEM: 0.4202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5642, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.5819, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||: 11%|# | 10/95 [00:06<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9622, LAS: 0.9240, UEM: 0.6498, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1761, partial_loss/deprel_loss: 0.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4628, loss: 0.6004, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||: 14%|#3 | 13/95 [00:08<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9591, LAS: 0.9210, UEM: 0.6203, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8691, partial_loss/deprel_loss: 0.6093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.6202, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||: 17%|#6 | 16/95 [00:11<00:55, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9585, LAS: 0.9200, UEM: 0.6173, LEM: 0.3775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9060, partial_loss/deprel_loss: 0.6450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8995, loss: 0.6287, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 21%|##1 | 20/95 [00:13<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9577, LAS: 0.9189, UEM: 0.6070, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.4049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.6363, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 24%|##4 | 23/95 [00:16<00:51, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9603, LAS: 0.9221, UEM: 0.6962, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0908, partial_loss/deprel_loss: 0.2607, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.6100, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 27%|##7 | 26/95 [00:19<00:56, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9596, LAS: 0.9213, UEM: 0.6856, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2466, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5332, loss: 0.6146, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 31%|### | 29/95 [00:21<00:53, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9588, LAS: 0.9204, UEM: 0.6891, LEM: 0.4723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.6208, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 34%|###3 | 32/95 [00:23<00:49, 1.27it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9587, LAS: 0.9200, UEM: 0.6841, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7536, partial_loss/deprel_loss: 0.5833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8195, loss: 0.6237, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 37%|###6 | 35/95 [00:26<00:47, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9590, LAS: 0.9205, UEM: 0.6883, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6676, partial_loss/deprel_loss: 0.5064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7408, loss: 0.6198, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||: 40%|#### | 38/95 [00:28<00:45, 1.25it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9595, LAS: 0.9206, UEM: 0.6843, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2497, partial_loss/deprel_loss: 0.3926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5662, loss: 0.6188, batch_reg_loss: 0.2022, reg_loss: 0.2022 ||: 44%|####4 | 42/95 [00:31<00:40, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9583, LAS: 0.9195, UEM: 0.6712, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3946, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6381, loss: 0.6288, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 47%|####7 | 45/95 [00:33<00:37, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9589, LAS: 0.9200, UEM: 0.6707, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2488, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5565, loss: 0.6250, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 51%|##### | 48/95 [00:35<00:34, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9582, LAS: 0.9192, UEM: 0.6620, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4370, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6424, loss: 0.6316, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 55%|#####4 | 52/95 [00:38<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9590, LAS: 0.9201, UEM: 0.6630, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2529, partial_loss/deprel_loss: 0.3615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5419, loss: 0.6265, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 59%|#####8 | 56/95 [00:40<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9591, LAS: 0.9204, UEM: 0.6680, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5619, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7107, loss: 0.6241, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 63%|######3 | 60/95 [00:43<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9593, LAS: 0.9207, UEM: 0.6668, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4439, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.6225, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 66%|######6 | 63/95 [00:45<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9598, LAS: 0.9211, UEM: 0.6707, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3855, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6277, loss: 0.6206, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 69%|######9 | 66/95 [00:47<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9595, LAS: 0.9208, UEM: 0.6629, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4894, partial_loss/deprel_loss: 0.4298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6225, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||: 73%|#######2 | 69/95 [00:49<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9592, LAS: 0.9206, UEM: 0.6657, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1943, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4963, loss: 0.6230, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||: 77%|#######6 | 73/95 [00:51<00:14, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9583, LAS: 0.9196, UEM: 0.6557, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9570, partial_loss/deprel_loss: 0.6285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.6307, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||: 82%|########2 | 78/95 [00:54<00:10, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9577, LAS: 0.9189, UEM: 0.6487, LEM: 0.4199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6121, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7465, loss: 0.6344, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||: 87%|########7 | 83/95 [00:56<00:06, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9578, LAS: 0.9188, UEM: 0.6475, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4638, partial_loss/deprel_loss: 0.5290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.6341, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||: 93%|#########2| 88/95 [00:59<00:03, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9584, LAS: 0.9194, UEM: 0.6526, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2525, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.6302, batch_reg_loss: 0.2020, reg_loss: 0.2021 ||: 97%|#########6| 92/95 [01:02<00:01, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9579, LAS: 0.9188, UEM: 0.6505, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.4896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.6343, batch_reg_loss: 0.2020, reg_loss: 0.2021 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer - reg_loss | 0.202 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UEM | 0.650 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LEM | 0.416 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EM | 0.917 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.377 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.490 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - loss | 0.634 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LAS | 0.919 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:31,296 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:31,299 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:11:35,526 - INFO - combo.training.trainer - Epoch duration: 0:01:11.235946\n", + "2023-04-07 01:11:35,526 - INFO - combo.training.trainer - Estimated training time remaining: 5:12:22\n", + "2023-04-07 01:11:35,526 - INFO - allennlp.training.trainer - Epoch 125/399\n", + "2023-04-07 01:11:35,526 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:11:35,527 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:11:35,534 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9727, LAS: 0.9330, UEM: 0.7624, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2298, partial_loss/deprel_loss: 0.3928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.5460, batch_reg_loss: 0.2020, reg_loss: 0.2020 ||: 3%|3 | 3/95 [00:02<01:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9598, LAS: 0.9199, UEM: 0.6872, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6276, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 6%|6 | 6/95 [00:04<01:10, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9616, LAS: 0.9217, UEM: 0.6680, LEM: 0.3982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6213, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 11%|# | 10/95 
[00:07<01:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9636, LAS: 0.9240, UEM: 0.6833, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.5963, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 15%|#4 | 14/95 [00:10<00:59, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9638, LAS: 0.9243, UEM: 0.6749, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6290, loss: 0.5924, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 18%|#7 | 17/95 [00:12<00:58, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9627, LAS: 0.9238, UEM: 0.6518, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4117, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6167, loss: 0.5937, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9643, LAS: 0.9255, UEM: 0.6762, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1209, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4581, loss: 0.5823, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||: 24%|##4 | 23/95 [00:16<00:53, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9662, LAS: 0.9276, UEM: 0.7097, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0926, partial_loss/deprel_loss: 0.2642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4317, loss: 0.5671, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||: 27%|##7 | 26/95 [00:19<00:53, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9650, LAS: 0.9264, UEM: 0.7100, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6103, partial_loss/deprel_loss: 0.5114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7330, loss: 0.5736, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||: 31%|### | 29/95 [00:21<00:51, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9643, LAS: 0.9255, UEM: 0.7037, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3383, partial_loss/deprel_loss: 0.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.5795, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||: 34%|###3 | 32/95 [00:24<00:48, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9626, LAS: 0.9236, UEM: 0.6871, LEM: 0.4382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.5208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7046, loss: 0.5945, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||: 37%|###6 | 35/95 [00:26<00:45, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9622, LAS: 0.9235, UEM: 0.6751, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3145, partial_loss/deprel_loss: 0.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5696, loss: 0.5969, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||: 40%|#### | 38/95 [00:28<00:42, 1.34it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9708, UAS: 0.9622, LAS: 0.9239, UEM: 0.6983, LEM: 0.4666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0376, partial_loss/deprel_loss: 0.1143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3007, loss: 0.5956, batch_reg_loss: 0.2017, reg_loss: 0.2019 ||: 43%|####3 | 41/95 [00:30<00:41, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9617, LAS: 0.9231, UEM: 0.6876, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.3355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5159, loss: 0.6006, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 47%|####7 | 45/95 [00:33<00:37, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9612, LAS: 0.9227, UEM: 0.6824, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5435, loss: 0.6015, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 52%|#####1 | 49/95 [00:36<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9600, LAS: 0.9214, UEM: 0.6797, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2860, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0190, loss: 0.6081, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 55%|#####4 | 52/95 [00:40<00:39, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9595, LAS: 0.9208, UEM: 0.6774, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.7134, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8025, loss: 0.6134, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 58%|#####7 | 55/95 [00:42<00:33, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9597, LAS: 0.9209, UEM: 0.6760, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2389, partial_loss/deprel_loss: 0.3760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5502, loss: 0.6121, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 61%|######1 | 58/95 [00:44<00:29, 1.25it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9596, LAS: 0.9208, UEM: 0.6722, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4008, partial_loss/deprel_loss: 0.3814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.6125, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 65%|######5 | 62/95 [00:46<00:24, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9599, LAS: 0.9212, UEM: 0.6732, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6662, loss: 0.6095, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||: 69%|######9 | 66/95 [00:49<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9597, LAS: 0.9212, UEM: 0.6806, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1058, partial_loss/deprel_loss: 0.2003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3831, loss: 0.6090, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||: 
73%|#######2 | 69/95 [00:51<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9598, LAS: 0.9213, UEM: 0.6795, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5656, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7299, loss: 0.6075, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||: 77%|#######6 | 73/95 [00:53<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9588, LAS: 0.9204, UEM: 0.6721, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7029, loss: 0.6140, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||: 81%|########1 | 77/95 [00:56<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9583, LAS: 0.9198, UEM: 0.6638, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7274, partial_loss/deprel_loss: 0.5789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.6188, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||: 85%|########5 | 81/95 [00:59<00:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9584, LAS: 0.9200, UEM: 0.6629, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1167, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.6179, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||: 89%|########9 | 85/95 [01:01<00:06, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9578, LAS: 0.9191, UEM: 0.6565, LEM: 0.4244, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6786, partial_loss/deprel_loss: 0.5944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8128, loss: 0.6245, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||: 95%|#########4| 90/95 [01:03<00:02, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9574, LAS: 0.9186, UEM: 0.6510, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6280, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||: 100%|##########| 95/95 [01:06<00:00, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9574, LAS: 0.9186, UEM: 0.6510, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6280, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 01:12:45,128 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9510, LAS: 0.9035, UEM: 0.7940, LEM: 0.6163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0306, partial_loss/deprel_loss: 17.9014, partial_loss/cycle_loss: 0.0000, batch_loss: 14.5273, loss: 9.4725, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9523, LAS: 0.9032, UEM: 0.7358, LEM: 0.5074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1613, partial_loss/deprel_loss: 
6.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1312, loss: 10.3144, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:05<00:06, 1.04s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9466, LAS: 0.8957, UEM: 0.6798, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5936, partial_loss/deprel_loss: 8.5089, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9258, loss: 11.1434, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9480, LAS: 0.8973, UEM: 0.6645, LEM: 0.4026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3634, partial_loss/deprel_loss: 8.6906, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0251, loss: 10.1889, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9497, LAS: 0.8995, UEM: 0.6775, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 7.0862, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7547, loss: 9.7858, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.03it/s] \n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - reg_loss | 0.202 | 0.000\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + 
"2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - UEM | 0.651 | 0.677\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - LEM | 0.418 | 0.409\n", + "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EM | 0.936 | 0.922\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.178 | 0.429\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | 0.950\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.335 | 7.086\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - loss | 0.628 | 9.786\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - LAS | 0.919 | 0.899\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:12:55,799 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:13:00,394 - INFO - combo.training.trainer - Epoch duration: 0:01:24.867347\n", + "2023-04-07 01:13:00,394 - INFO - combo.training.trainer - Estimated training time remaining: 5:11:50\n", + "2023-04-07 01:13:00,394 - INFO - allennlp.training.trainer - Epoch 126/399\n", + "2023-04-07 01:13:00,394 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:13:00,395 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:13:00,402 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9772, LAS: 0.9414, UEM: 0.8386, LEM: 0.6353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0986, partial_loss/deprel_loss: 0.1837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3682, loss: 0.4718, batch_reg_loss: 0.2016, reg_loss: 0.2016 ||: 3%|3 | 3/95 [00:02<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9713, LAS: 0.9333, UEM: 0.7912, LEM: 0.5681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.2594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4351, loss: 0.5159, batch_reg_loss: 0.2015, reg_loss: 0.2016 ||: 6%|6 | 6/95 [00:04<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9652, LAS: 0.9277, UEM: 0.7161, LEM: 0.4873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2455, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5626, loss: 0.5609, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||: 11%|# | 10/95 
[00:06<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9684, LAS: 0.9322, UEM: 0.7560, LEM: 0.5313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4035, loss: 0.5308, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||: 15%|#4 | 14/95 [00:09<00:54, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9651, LAS: 0.9286, UEM: 0.7391, LEM: 0.5164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1538, partial_loss/deprel_loss: 0.3231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4907, loss: 0.5543, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||: 18%|#7 | 17/95 [00:11<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9648, LAS: 0.9285, UEM: 0.7214, LEM: 0.4970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.5599, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||: 21%|##1 | 20/95 [00:13<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9655, LAS: 0.9289, UEM: 0.7323, LEM: 0.5032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.3889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.5538, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||: 24%|##4 | 23/95 [00:16<00:52, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9658, LAS: 0.9287, UEM: 0.7277, LEM: 0.4930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5463, loss: 0.5550, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 27%|##7 | 26/95 [00:18<00:51, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9655, LAS: 0.9283, UEM: 0.7182, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2810, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5692, loss: 0.5568, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 31%|### | 29/95 [00:20<00:48, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9652, LAS: 0.9283, UEM: 0.7284, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0355, partial_loss/deprel_loss: 0.1220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3061, loss: 0.5586, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 35%|###4 | 33/95 [00:23<00:46, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9636, LAS: 0.9265, UEM: 0.7188, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8579, partial_loss/deprel_loss: 0.5797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8367, loss: 0.5703, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 38%|###7 | 36/95 [00:25<00:43, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9643, LAS: 0.9269, UEM: 0.7215, LEM: 0.4945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1387, partial_loss/deprel_loss: 0.2731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4476, loss: 0.5679, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 41%|####1 | 39/95 [00:28<00:41, 1.36it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9623, LAS: 0.9248, UEM: 0.7082, LEM: 0.4834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3996, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0902, loss: 0.5859, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||: 44%|####4 | 42/95 [00:30<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9614, LAS: 0.9236, UEM: 0.6933, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8482, partial_loss/deprel_loss: 0.6434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8857, loss: 0.5937, batch_reg_loss: 0.2013, reg_loss: 0.2015 ||: 48%|####8 | 46/95 [00:32<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9623, LAS: 0.9244, UEM: 0.7066, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1985, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.5878, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 52%|#####1 | 49/95 [00:34<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9618, LAS: 0.9238, UEM: 0.7034, LEM: 0.4771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6143, partial_loss/deprel_loss: 0.5572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7699, loss: 0.5918, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 55%|#####4 | 52/95 [00:37<00:31, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9615, LAS: 0.9233, UEM: 0.6965, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2506, partial_loss/deprel_loss: 0.3667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5971, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 59%|#####8 | 56/95 [00:39<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9609, LAS: 0.9227, UEM: 0.6897, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5770, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.5998, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 63%|######3 | 60/95 [00:42<00:23, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9600, LAS: 0.9217, UEM: 0.6836, LEM: 0.4567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3667, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.6066, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 67%|######7 | 64/95 [00:44<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9586, LAS: 0.9201, UEM: 0.6741, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5645, partial_loss/deprel_loss: 0.4994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.6182, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 72%|#######1 | 68/95 [00:47<00:18, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9581, LAS: 0.9196, UEM: 0.6668, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6667, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7827, loss: 0.6209, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 
76%|#######5 | 72/95 [00:49<00:15, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9575, LAS: 0.9190, UEM: 0.6594, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5403, partial_loss/deprel_loss: 0.4920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7029, loss: 0.6248, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 80%|######## | 76/95 [00:52<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9580, LAS: 0.9195, UEM: 0.6659, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3179, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5655, loss: 0.6214, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||: 84%|########4 | 80/95 [00:55<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9579, LAS: 0.9194, UEM: 0.6578, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6261, loss: 0.6225, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||: 89%|########9 | 85/95 [00:58<00:06, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9581, LAS: 0.9196, UEM: 0.6574, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2276, partial_loss/deprel_loss: 0.2833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4734, loss: 0.6205, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||: 94%|#########3| 89/95 [01:00<00:03, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9579, LAS: 0.9195, UEM: 0.6501, LEM: 0.4220, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4741, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.6220, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||: 98%|#########7| 93/95 [01:02<00:01, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9576, LAS: 0.9191, UEM: 0.6473, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9417, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8535, loss: 0.6244, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - reg_loss | 0.201 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - UEM | 0.647 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - LEM | 0.419 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EM | 0.883 | N/A\n", + "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.942 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.580 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - loss | 0.624 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - LAS | 0.919 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:14:07,179 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:14:12,486 - INFO - combo.training.trainer - Epoch duration: 0:01:12.091447\n", + "2023-04-07 01:14:12,486 - INFO - combo.training.trainer - Estimated training time remaining: 5:10:50\n", + "2023-04-07 01:14:12,486 - INFO - allennlp.training.trainer - Epoch 127/399\n", + "2023-04-07 01:14:12,487 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:14:12,487 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:14:12,497 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9739, LAS: 0.9382, UEM: 0.7630, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2674, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5111, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||: 4%|4 | 4/95 [00:02<00:45, 1.98it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9681, LAS: 0.9307, UEM: 0.7433, LEM: 0.4810, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1699, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.5487, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||: 8%|8 | 8/95 [00:05<00:50, 1.71it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9642, LAS: 0.9272, UEM: 0.7015, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2023, partial_loss/deprel_loss: 0.3681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.5721, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||: 12%|#1 | 11/95 
[00:07<00:52, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9613, LAS: 0.9238, UEM: 0.6804, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5743, partial_loss/deprel_loss: 0.5249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.5969, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||: 16%|#5 | 15/95 [00:09<00:50, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9621, LAS: 0.9246, UEM: 0.6907, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5297, loss: 0.5854, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||: 19%|#8 | 18/95 [00:12<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9650, LAS: 0.9283, UEM: 0.7494, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0463, partial_loss/deprel_loss: 0.1296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3141, loss: 0.5614, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||: 22%|##2 | 21/95 [00:14<00:55, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9650, LAS: 0.9281, UEM: 0.7352, LEM: 0.5033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5185, loss: 0.5639, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||: 26%|##6 | 25/95 [00:17<00:48, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9653, LAS: 0.9285, UEM: 0.7276, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2053, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.5639, batch_reg_loss: 0.2011, reg_loss: 0.2011 ||: 31%|### | 29/95 [00:19<00:44, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9656, LAS: 0.9284, UEM: 0.7280, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.4142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5948, loss: 0.5647, batch_reg_loss: 0.2011, reg_loss: 0.2011 ||: 34%|###3 | 32/95 [00:21<00:42, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9645, LAS: 0.9272, UEM: 0.7129, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1832, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5741, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||: 38%|###7 | 36/95 [00:24<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9649, LAS: 0.9274, UEM: 0.7101, LEM: 0.4685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3522, partial_loss/deprel_loss: 0.4360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6202, loss: 0.5739, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||: 41%|####1 | 39/95 [00:26<00:39, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9654, LAS: 0.9278, UEM: 0.7141, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.4392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6216, loss: 0.5726, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||: 44%|####4 | 42/95 [00:28<00:37, 1.42it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9647, LAS: 0.9272, UEM: 0.7092, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1644, partial_loss/deprel_loss: 0.2823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5752, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||: 48%|####8 | 46/95 [00:31<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9630, LAS: 0.9255, UEM: 0.7011, LEM: 0.4610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5878, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||: 52%|#####1 | 49/95 [00:33<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9631, LAS: 0.9255, UEM: 0.7005, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1052, partial_loss/deprel_loss: 0.2660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4348, loss: 0.5863, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||: 56%|#####5 | 53/95 [00:36<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9629, LAS: 0.9252, UEM: 0.6964, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1875, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4619, loss: 0.5870, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||: 60%|###### | 57/95 [00:39<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9625, LAS: 0.9246, UEM: 0.6915, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2424, partial_loss/deprel_loss: 0.4287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5924, loss: 0.5919, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||: 64%|######4 | 61/95 [00:42<00:23, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9619, LAS: 0.9241, UEM: 0.6864, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5492, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.5949, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||: 67%|######7 | 64/95 [00:44<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9606, LAS: 0.9227, UEM: 0.6774, LEM: 0.4413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7253, partial_loss/deprel_loss: 0.5621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.6048, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||: 71%|####### | 67/95 [00:46<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9610, LAS: 0.9228, UEM: 0.6762, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5750, loss: 0.6024, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9600, LAS: 0.9219, UEM: 0.6669, LEM: 0.4278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7751, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8324, loss: 0.6088, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||: 79%|#######8 | 75/95 [00:51<00:13, 1.51it/s]\n" + ] + }, + { + "name": 
"stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9601, LAS: 0.9222, UEM: 0.6717, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5031, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7030, loss: 0.6068, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||: 83%|########3 | 79/95 [00:54<00:11, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9590, LAS: 0.9210, UEM: 0.6638, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1759, partial_loss/deprel_loss: 0.7507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0366, loss: 0.6173, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 86%|########6 | 82/95 [00:56<00:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9586, LAS: 0.9206, UEM: 0.6571, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3880, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.6197, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 89%|########9 | 85/95 [00:59<00:07, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9586, LAS: 0.9205, UEM: 0.6572, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6085, partial_loss/deprel_loss: 0.5601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6196, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 93%|#########2| 88/95 [01:01<00:05, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9593, LAS: 0.9212, UEM: 0.6665, LEM: 0.4321, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0789, partial_loss/deprel_loss: 0.2412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.6155, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 97%|#########6| 92/95 [01:04<00:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9590, LAS: 0.9209, UEM: 0.6612, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3630, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.6174, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n", + "2023-04-07 01:15:21,660 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - reg_loss | 0.201 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UEM | 0.661 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - LEM | 0.427 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EM | 0.926 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.363 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.395 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - loss | 0.617 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - LAS | 0.921 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:21,667 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:15:26,676 - INFO - combo.training.trainer - Epoch duration: 0:01:14.189760\n", + "2023-04-07 01:15:26,677 - INFO - combo.training.trainer - Estimated training time remaining: 5:09:54\n", + "2023-04-07 01:15:26,677 - INFO - allennlp.training.trainer - Epoch 128/399\n", + "2023-04-07 01:15:26,677 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:15:26,678 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:15:26,688 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9631, LAS: 0.9239, UEM: 0.6215, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5215, loss: 0.5860, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||: 3%|3 | 3/95 [00:02<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9607, LAS: 0.9213, UEM: 0.6019, LEM: 0.3412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1463, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4853, loss: 0.6123, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||: 7%|7 | 7/95 [00:04<00:57, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9596, LAS: 0.9208, UEM: 0.6229, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4060, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.6096, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||: 13%|#2 | 12/95 [00:06<00:49, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9572, LAS: 0.9186, UEM: 0.6252, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5571, partial_loss/deprel_loss: 0.4929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.6281, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||: 17%|#6 | 16/95 [00:08<00:45, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9584, LAS: 0.9201, UEM: 0.6581, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0955, partial_loss/deprel_loss: 0.2614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.6133, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||: 22%|##2 | 21/95 [00:11<00:41, 1.80it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9592, LAS: 0.9209, UEM: 0.6667, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3006, partial_loss/deprel_loss: 0.4103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.6094, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||: 26%|##6 | 25/95 [00:13<00:40, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9610, LAS: 0.9231, UEM: 0.6955, LEM: 0.4624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2267, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5951, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||: 31%|### | 29/95 [00:16<00:40, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9602, LAS: 0.9222, UEM: 0.6792, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3083, partial_loss/deprel_loss: 0.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.6033, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||: 35%|###4 | 33/95 [00:19<00:39, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9596, LAS: 0.9220, UEM: 0.6778, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.6060, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||: 39%|###8 | 37/95 [00:22<00:38, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9593, LAS: 0.9215, UEM: 0.6763, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.6038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.6095, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 43%|####3 | 41/95 [00:24<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9597, LAS: 0.9218, UEM: 0.6778, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4898, loss: 0.6066, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 46%|####6 | 44/95 [00:27<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9589, LAS: 0.9205, UEM: 0.6627, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6611, partial_loss/deprel_loss: 0.5736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7917, loss: 0.6158, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 51%|##### | 48/95 [00:29<00:32, 1.46it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9577, LAS: 0.9195, UEM: 0.6543, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2906, partial_loss/deprel_loss: 0.3542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5421, loss: 0.6220, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 54%|#####3 | 51/95 [00:31<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9582, LAS: 0.9200, UEM: 0.6520, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1726, partial_loss/deprel_loss: 0.2786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.6194, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 57%|#####6 | 54/95 [00:33<00:28, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9581, LAS: 0.9200, UEM: 0.6490, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6074, partial_loss/deprel_loss: 0.5364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7512, loss: 0.6199, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 60%|###### | 57/95 [00:36<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9582, LAS: 0.9202, UEM: 0.6509, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2521, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.6191, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 63%|######3 | 60/95 [00:38<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9583, LAS: 0.9202, UEM: 0.6537, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.3821, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6607, loss: 0.6180, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 66%|######6 | 63/95 [00:40<00:23, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9579, LAS: 0.9197, UEM: 0.6464, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7458, partial_loss/deprel_loss: 0.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8320, loss: 0.6227, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 69%|######9 | 66/95 [00:42<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9579, LAS: 0.9197, UEM: 0.6427, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.3035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4836, loss: 0.6232, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||: 73%|#######2 | 69/95 [00:44<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9574, LAS: 0.9192, UEM: 0.6365, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3333, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.6278, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||: 77%|#######6 | 73/95 [00:47<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9570, LAS: 0.9188, UEM: 0.6392, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1122, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4062, loss: 0.6284, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||: 81%|########1 | 77/95 [00:49<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9188, UEM: 0.6399, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.6296, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||: 84%|########4 | 80/95 [00:52<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9574, LAS: 0.9193, UEM: 0.6407, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2936, partial_loss/deprel_loss: 0.4140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5905, loss: 0.6260, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||: 88%|########8 | 84/95 [00:54<00:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9582, LAS: 0.9201, UEM: 0.6564, LEM: 0.4279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3467, partial_loss/deprel_loss: 0.3845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.6202, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||: 93%|#########2| 88/95 [00:57<00:04, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9585, LAS: 0.9203, UEM: 0.6591, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4352, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7046, loss: 0.6176, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||: 97%|#########6| 92/95 [00:59<00:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9582, LAS: 0.9201, UEM: 0.6531, LEM: 0.4225, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5036, partial_loss/deprel_loss: 0.5400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7332, loss: 0.6198, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - reg_loss | 0.201 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - UEM | 0.653 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - LEM | 0.422 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EM | 0.897 | N/A\n", + "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.504 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.540 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - loss | 0.620 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - LAS | 0.920 | N/A\n", + "2023-04-07 
01:16:31,054 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:31,058 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:16:35,283 - INFO - combo.training.trainer - Epoch duration: 0:01:08.605642\n", + "2023-04-07 01:16:35,283 - INFO - combo.training.trainer - Estimated training time remaining: 5:08:46\n", + "2023-04-07 01:16:35,283 - INFO - allennlp.training.trainer - Epoch 129/399\n", + "2023-04-07 01:16:35,283 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:16:35,284 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:16:35,293 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9487, LAS: 0.9084, UEM: 0.4551, LEM: 0.2244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6219, partial_loss/deprel_loss: 0.5310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7497, loss: 0.7101, batch_reg_loss: 0.2005, reg_loss: 0.2005 ||: 3%|3 | 3/95 [00:02<01:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9595, LAS: 0.9227, UEM: 0.5622, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1934, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5250, loss: 0.6236, batch_reg_loss: 0.2004, reg_loss: 0.2005 ||: 7%|7 | 7/95 [00:04<00:57, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9568, LAS: 0.9193, UEM: 0.6007, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6336, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||: 11%|# | 10/95 [00:06<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9604, LAS: 0.9228, UEM: 0.6565, LEM: 0.4014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1986, partial_loss/deprel_loss: 0.3299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5041, loss: 0.6059, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||: 14%|#3 | 13/95 [00:09<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9605, LAS: 0.9228, UEM: 0.6833, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4336, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.6044, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||: 17%|#6 | 16/95 [00:11<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9621, LAS: 0.9241, UEM: 0.6955, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5454, loss: 0.5916, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||: 20%|## | 19/95 [00:13<00:55, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9618, LAS: 0.9234, UEM: 0.6882, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1866, partial_loss/deprel_loss: 0.3131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5959, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||: 23%|##3 | 22/95 [00:15<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9617, LAS: 0.9238, UEM: 0.6714, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.4234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.5981, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 28%|##8 | 27/95 [00:17<00:43, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9605, LAS: 0.9225, UEM: 0.6491, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3813, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5994, loss: 0.6075, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 34%|###3 | 32/95 [00:20<00:37, 1.66it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9600, LAS: 0.9222, UEM: 0.6444, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2141, partial_loss/deprel_loss: 0.3387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.6112, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 39%|###8 | 37/95 [00:22<00:32, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9600, LAS: 0.9222, UEM: 0.6411, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.6134, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 44%|####4 | 42/95 [00:25<00:28, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9594, LAS: 0.9214, UEM: 0.6397, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8439, partial_loss/deprel_loss: 0.5619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8186, loss: 0.6150, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 48%|####8 | 46/95 [00:28<00:29, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9606, LAS: 0.9228, UEM: 0.6704, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6069, loss: 0.6046, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||: 53%|#####2 | 50/95 [00:31<00:30, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9603, LAS: 0.9223, UEM: 0.6629, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1744, partial_loss/deprel_loss: 0.3334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.6073, batch_reg_loss: 0.2002, reg_loss: 0.2004 ||: 57%|#####6 | 54/95 [00:34<00:26, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9609, LAS: 0.9229, UEM: 0.6689, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1728, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.6016, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 61%|######1 | 58/95 [00:36<00:24, 
1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9605, LAS: 0.9227, UEM: 0.6625, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.3101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5079, loss: 0.6039, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 65%|######5 | 62/95 [00:39<00:21, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9603, LAS: 0.9224, UEM: 0.6588, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4922, partial_loss/deprel_loss: 0.5550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.6062, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 69%|######9 | 66/95 [00:42<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9606, LAS: 0.9228, UEM: 0.6639, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3517, partial_loss/deprel_loss: 0.4263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6116, loss: 0.6030, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 73%|#######2 | 69/95 [00:44<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9603, LAS: 0.9225, UEM: 0.6559, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6056, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.6070, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 76%|#######5 | 72/95 [00:46<00:16, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9601, LAS: 0.9222, UEM: 0.6523, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4340, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.6086, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 79%|#######8 | 75/95 [00:49<00:15, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9603, LAS: 0.9224, UEM: 0.6567, LEM: 0.4222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1000, partial_loss/deprel_loss: 0.2497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4199, loss: 0.6076, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 82%|########2 | 78/95 [00:51<00:12, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9599, LAS: 0.9220, UEM: 0.6516, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2894, partial_loss/deprel_loss: 0.3204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.6095, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||: 86%|########6 | 82/95 [00:53<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9592, LAS: 0.9214, UEM: 0.6509, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4873, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6590, loss: 0.6129, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 89%|########9 | 85/95 [00:56<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9593, LAS: 0.9216, UEM: 0.6544, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0975, partial_loss/deprel_loss: 0.2299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4035, loss: 0.6113, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 93%|#########2| 88/95 
[00:58<00:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9585, LAS: 0.9207, UEM: 0.6479, LEM: 0.4169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1383, partial_loss/deprel_loss: 0.6807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9724, loss: 0.6168, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 96%|#########5| 91/95 [01:00<00:02, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9586, LAS: 0.9208, UEM: 0.6522, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9341, partial_loss/deprel_loss: 0.6648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9187, loss: 0.6163, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 99%|#########8| 94/95 [01:02<00:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9587, LAS: 0.9209, UEM: 0.6532, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5373, loss: 0.6154, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - reg_loss | 0.200 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - UEM | 0.653 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - 
combo.training.tensorboard_writer - LEM | 0.422 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EM | 0.929 | N/A\n", + "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.211 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.369 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - loss | 0.615 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - LAS | 0.921 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:17:42,136 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:17:47,046 - INFO - combo.training.trainer - Epoch duration: 0:01:11.763142\n", + "2023-04-07 01:17:47,047 - INFO - combo.training.trainer - Estimated training time remaining: 5:07:45\n", + "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - Epoch 130/399\n", + "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:17:47,055 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9790, LAS: 0.9467, UEM: 0.8767, LEM: 0.7108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1059, partial_loss/deprel_loss: 0.2329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4076, loss: 0.4231, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||: 3%|3 | 3/95 [00:02<01:13, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9716, LAS: 0.9350, UEM: 0.7807, LEM: 0.5725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4357, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6780, loss: 0.5086, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||: 7%|7 | 7/95 [00:05<01:07, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9682, LAS: 0.9306, UEM: 0.7316, LEM: 0.5186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.5421, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||: 11%|# | 10/95 [00:07<01:04, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9620, LAS: 0.9238, UEM: 0.7156, LEM: 0.5068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2515, partial_loss/deprel_loss: 0.7855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0787, loss: 0.5891, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||: 14%|#3 | 13/95 [00:09<01:03, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9610, LAS: 0.9234, UEM: 0.6973, LEM: 0.4832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5205, loss: 0.5968, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||: 17%|#6 | 16/95 [00:11<00:59, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9626, LAS: 0.9249, UEM: 0.6968, LEM: 0.4707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1997, partial_loss/deprel_loss: 0.3292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5830, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 20%|## | 19/95 [00:13<00:55, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9620, LAS: 0.9240, UEM: 0.6781, LEM: 0.4459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5423, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7048, loss: 0.5941, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 24%|##4 | 23/95 [00:16<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9593, LAS: 0.9211, UEM: 0.6633, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.4034, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.6109, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 28%|##8 | 27/95 [00:18<00:45, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9597, LAS: 0.9215, UEM: 0.6719, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.5457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7553, loss: 0.6088, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 32%|###1 | 30/95 [00:21<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9605, LAS: 0.9221, UEM: 0.6805, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5358, partial_loss/deprel_loss: 0.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7040, loss: 0.6035, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 35%|###4 | 33/95 [00:23<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9608, LAS: 0.9222, UEM: 0.6809, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6867, partial_loss/deprel_loss: 0.5800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8013, loss: 0.6046, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||: 38%|###7 | 36/95 [00:25<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9597, LAS: 0.9208, UEM: 0.6796, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6576, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7880, loss: 0.6127, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||: 42%|####2 | 40/95 [00:27<00:35, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9605, LAS: 0.9216, UEM: 0.6810, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3295, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5839, loss: 0.6071, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||: 47%|####7 | 45/95 [00:29<00:29, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9609, LAS: 0.9219, UEM: 0.6751, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2667, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5780, loss: 0.6060, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||: 53%|#####2 | 50/95 [00:31<00:24, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9603, LAS: 0.9211, UEM: 0.6737, LEM: 0.4332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4861, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6114, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 57%|#####6 | 54/95 [00:33<00:22, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9599, LAS: 0.9210, UEM: 0.6660, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4030, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6325, loss: 0.6132, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 61%|######1 | 58/95 [00:36<00:20, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9606, LAS: 0.9218, UEM: 0.6709, LEM: 0.4270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2830, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.5605, loss: 0.6065, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 65%|######5 | 62/95 [00:39<00:19, 1.68it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9600, LAS: 0.9212, UEM: 0.6656, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.6111, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 69%|######9 | 66/95 [00:42<00:19, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9605, LAS: 0.9219, UEM: 0.6708, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1165, partial_loss/deprel_loss: 0.2782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.6058, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 74%|#######3 | 70/95 [00:45<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9596, LAS: 0.9209, UEM: 0.6613, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9136, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8392, loss: 0.6117, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 78%|#######7 | 74/95 [00:47<00:13, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9597, LAS: 0.9210, UEM: 0.6599, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4612, loss: 0.6109, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||: 82%|########2 | 78/95 [00:50<00:11, 1.50it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9593, LAS: 0.9207, UEM: 0.6565, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6489, partial_loss/deprel_loss: 0.5137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.6117, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 86%|########6 | 82/95 [00:53<00:09, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9596, LAS: 0.9210, UEM: 0.6572, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.6099, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 89%|########9 | 85/95 [00:56<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9592, LAS: 0.9206, UEM: 0.6511, LEM: 0.4111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.4810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.6140, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 94%|#########3| 89/95 [00:58<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9595, LAS: 0.9209, UEM: 0.6614, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0337, partial_loss/deprel_loss: 0.1437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3215, loss: 0.6122, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 97%|#########6| 92/95 [01:00<00:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9592, LAS: 0.9206, UEM: 0.6562, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5121, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.6141, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 100%|##########| 95/95 [01:03<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9592, LAS: 0.9206, UEM: 0.6562, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5121, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.6141, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 01:18:53,395 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9522, LAS: 0.9051, UEM: 0.8053, LEM: 0.6314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 5.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3104, loss: 8.7662, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.09s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9489, LAS: 0.9015, UEM: 0.7739, LEM: 0.5648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5831, partial_loss/deprel_loss: 21.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 17.7727, loss: 10.0723, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:04<00:07, 1.12s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9504, LAS: 0.9011, UEM: 0.7239, LEM: 0.4769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3935, partial_loss/deprel_loss: 6.7236, partial_loss/cycle_loss: 0.0000, batch_loss: 
5.4576, loss: 9.6231, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.08s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9502, LAS: 0.9006, UEM: 0.6871, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0650, partial_loss/deprel_loss: 9.9326, partial_loss/cycle_loss: 0.0000, batch_loss: 8.1591, loss: 9.1834, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:10<00:01, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9512, LAS: 0.9009, UEM: 0.6878, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4606, partial_loss/deprel_loss: 8.6600, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0201, loss: 8.9867, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00, 1.01s/it]\n", + "2023-04-07 01:19:04,558 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:19:04,558 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - reg_loss | 0.200 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UEM | 0.656 | 0.688\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LEM | 0.423 | 0.415\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EM | 0.909 | 0.903\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.512 | 0.461\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 
0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | 0.951\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.467 | 8.660\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - loss | 0.614 | 8.987\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LAS | 0.921 | 0.901\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:19:04,564 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:19:09,248 - INFO - combo.training.trainer - Epoch duration: 0:01:22.200925\n", + "2023-04-07 01:19:09,248 - INFO - combo.training.trainer - Estimated training time remaining: 5:07:05\n", + "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - Epoch 131/399\n", + "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:19:09,259 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9535, LAS: 0.9158, UEM: 0.5011, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4068, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.6570, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||: 4%|4 | 4/95 [00:02<00:55, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9538, LAS: 0.9153, UEM: 0.5257, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4342, partial_loss/deprel_loss: 0.5154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6989, loss: 0.6594, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||: 8%|8 | 8/95 [00:04<00:52, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9604, LAS: 0.9219, UEM: 0.6755, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.6061, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||: 12%|#1 | 11/95 
[00:07<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9596, LAS: 0.9214, UEM: 0.6476, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4787, partial_loss/deprel_loss: 0.4810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.6183, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||: 15%|#4 | 14/95 [00:09<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9558, LAS: 0.9178, UEM: 0.5973, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9191, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8531, loss: 0.6437, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||: 19%|#8 | 18/95 [00:11<00:50, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9582, LAS: 0.9205, UEM: 0.6412, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4812, loss: 0.6236, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||: 22%|##2 | 21/95 [00:14<00:51, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9574, LAS: 0.9199, UEM: 0.6314, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6610, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7047, loss: 0.6270, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||: 26%|##6 | 25/95 [00:16<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9572, LAS: 0.9199, UEM: 0.6175, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.6262, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||: 31%|### | 29/95 [00:19<00:42, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9579, LAS: 0.9208, UEM: 0.6278, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.6206, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||: 34%|###3 | 32/95 [00:21<00:42, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9596, LAS: 0.9229, UEM: 0.6748, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.4496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6307, loss: 0.6067, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||: 37%|###6 | 35/95 [00:23<00:44, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9596, LAS: 0.9226, UEM: 0.6779, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8268, loss: 0.6067, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||: 41%|####1 | 39/95 [00:26<00:38, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9594, LAS: 0.9223, UEM: 0.6655, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8453, partial_loss/deprel_loss: 0.5137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7797, loss: 0.6100, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 46%|####6 | 44/95 [00:28<00:31, 1.61it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9581, LAS: 0.9209, UEM: 0.6483, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0519, partial_loss/deprel_loss: 0.5943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8854, loss: 0.6173, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 52%|#####1 | 49/95 [00:30<00:26, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9574, LAS: 0.9203, UEM: 0.6443, LEM: 0.4240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1752, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4578, loss: 0.6196, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 56%|#####5 | 53/95 [00:33<00:23, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9578, LAS: 0.9204, UEM: 0.6455, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6243, partial_loss/deprel_loss: 0.5155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7368, loss: 0.6177, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 60%|###### | 57/95 [00:35<00:21, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9573, LAS: 0.9199, UEM: 0.6416, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.2771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4552, loss: 0.6219, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 64%|######4 | 61/95 [00:38<00:20, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9586, LAS: 0.9211, UEM: 0.6617, LEM: 0.4350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2029, partial_loss/deprel_loss: 0.3563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5252, loss: 0.6137, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 68%|######8 | 65/95 [00:41<00:19, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9583, LAS: 0.9207, UEM: 0.6527, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3263, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.6164, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||: 73%|#######2 | 69/95 [00:44<00:17, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9588, LAS: 0.9213, UEM: 0.6577, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2250, partial_loss/deprel_loss: 0.3399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.6119, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||: 77%|#######6 | 73/95 [00:47<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9587, LAS: 0.9211, UEM: 0.6497, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3552, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.6139, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||: 81%|########1 | 77/95 [00:49<00:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9590, LAS: 0.9215, UEM: 0.6537, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3266, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.6116, batch_reg_loss: 0.1995, reg_loss: 0.1997 
||: 85%|########5 | 81/95 [00:52<00:09, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9594, LAS: 0.9219, UEM: 0.6617, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2208, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.6079, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||: 88%|########8 | 84/95 [00:54<00:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9586, LAS: 0.9211, UEM: 0.6562, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6149, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.6144, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||: 92%|#########1| 87/95 [00:56<00:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9590, LAS: 0.9214, UEM: 0.6612, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5799, loss: 0.6115, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||: 95%|#########4| 90/95 [00:59<00:03, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9591, LAS: 0.9216, UEM: 0.6571, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3742, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5592, loss: 0.6103, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||: 99%|#########8| 94/95 [01:01<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9591, LAS: 0.9216, UEM: 0.6561, LEM: 0.4257, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6228, loss: 0.6104, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - reg_loss | 0.200 | N/A\n", + "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UEM | 0.656 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LEM | 0.426 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - EM | 0.920 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.395 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.430 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - loss | 0.610 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + 
"2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:20:14,792 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:20:19,595 - INFO - combo.training.trainer - Epoch duration: 0:01:10.346127\n", + "2023-04-07 01:20:19,595 - INFO - combo.training.trainer - Estimated training time remaining: 5:06:00\n", + "2023-04-07 01:20:19,595 - INFO - allennlp.training.trainer - Epoch 132/399\n", + "2023-04-07 01:20:19,596 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:20:19,596 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:20:19,606 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9726, LAS: 0.9355, UEM: 0.7834, LEM: 0.5588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1801, partial_loss/deprel_loss: 0.3268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.5050, batch_reg_loss: 0.1995, reg_loss: 0.1995 ||: 3%|3 | 3/95 [00:02<01:15, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9665, LAS: 0.9290, UEM: 0.6954, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5365, loss: 0.5598, batch_reg_loss: 0.1994, reg_loss: 0.1995 ||: 6%|6 | 6/95 [00:04<01:11, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9568, LAS: 0.9192, UEM: 0.6097, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6579, partial_loss/deprel_loss: 0.5388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7621, loss: 0.6298, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 9%|9 | 9/95 [00:06<01:06, 1.30it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9581, LAS: 0.9204, UEM: 0.6453, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4929, loss: 0.6212, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 13%|#2 | 12/95 [00:09<01:02, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9562, LAS: 0.9191, UEM: 0.5933, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.4918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.6354, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 17%|#6 | 16/95 [00:11<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9586, LAS: 0.9215, UEM: 0.6436, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1133, partial_loss/deprel_loss: 0.2584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.6159, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 
20%|## | 19/95 [00:14<00:59, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9598, LAS: 0.9227, UEM: 0.6414, LEM: 0.4065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2147, partial_loss/deprel_loss: 0.3550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.6056, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 23%|##3 | 22/95 [00:16<00:55, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9595, LAS: 0.9226, UEM: 0.6297, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3931, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5889, loss: 0.6056, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 26%|##6 | 25/95 [00:18<00:53, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9583, LAS: 0.9213, UEM: 0.6171, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7926, partial_loss/deprel_loss: 0.5822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.6173, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||: 29%|##9 | 28/95 [00:21<00:50, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9583, LAS: 0.9213, UEM: 0.6311, LEM: 0.3954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9408, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.6161, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 33%|###2 | 31/95 [00:23<00:48, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9578, LAS: 0.9207, UEM: 0.6404, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4528, loss: 0.6182, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 36%|###5 | 34/95 [00:25<00:46, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9574, LAS: 0.9199, UEM: 0.6286, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6666, loss: 0.6246, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 40%|#### | 38/95 [00:28<00:40, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9572, LAS: 0.9197, UEM: 0.6213, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4091, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.6266, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 43%|####3 | 41/95 [00:30<00:38, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9579, LAS: 0.9202, UEM: 0.6249, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1761, partial_loss/deprel_loss: 0.3662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5274, loss: 0.6225, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 46%|####6 | 44/95 [00:32<00:37, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9579, LAS: 0.9203, UEM: 0.6215, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8664, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.6244, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 51%|##### | 48/95 [00:35<00:33, 
1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9576, LAS: 0.9199, UEM: 0.6289, LEM: 0.3925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1261, partial_loss/deprel_loss: 0.2248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.6267, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 54%|#####3 | 51/95 [00:37<00:31, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9582, LAS: 0.9207, UEM: 0.6301, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5878, partial_loss/deprel_loss: 0.4516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.6213, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||: 59%|#####8 | 56/95 [00:39<00:25, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9578, LAS: 0.9204, UEM: 0.6178, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4879, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6683, loss: 0.6228, batch_reg_loss: 0.1993, reg_loss: 0.1993 ||: 64%|######4 | 61/95 [00:42<00:20, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9581, LAS: 0.9205, UEM: 0.6223, LEM: 0.3820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6060, partial_loss/deprel_loss: 0.4639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6916, loss: 0.6196, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 68%|######8 | 65/95 [00:44<00:18, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9372, UAS: 0.9579, LAS: 0.9202, UEM: 0.6264, LEM: 0.3853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.3032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4794, loss: 0.6218, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 73%|#######2 | 69/95 [00:47<00:15, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9579, LAS: 0.9200, UEM: 0.6206, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4641, partial_loss/deprel_loss: 0.4905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.6241, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 77%|#######6 | 73/95 [00:49<00:13, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9578, LAS: 0.9199, UEM: 0.6231, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1604, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6250, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 81%|########1 | 77/95 [00:51<00:10, 1.69it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9585, LAS: 0.9208, UEM: 0.6421, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.2897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.6171, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 85%|########5 | 81/95 [00:54<00:08, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9587, LAS: 0.9212, UEM: 0.6542, LEM: 0.4252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7923, partial_loss/deprel_loss: 0.5080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.6143, 
batch_reg_loss: 0.1992, reg_loss: 0.1993 ||: 89%|########9 | 85/95 [00:56<00:06, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9590, LAS: 0.9216, UEM: 0.6569, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2455, partial_loss/deprel_loss: 0.3351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5163, loss: 0.6113, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||: 95%|#########4| 90/95 [00:59<00:02, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9591, LAS: 0.9216, UEM: 0.6544, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.4717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.6107, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||: 99%|#########8| 94/95 [01:01<00:00, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9593, LAS: 0.9218, UEM: 0.6573, LEM: 0.4266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1718, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4596, loss: 0.6091, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - reg_loss | 0.199 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - UEM | 
0.657 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - LEM | 0.427 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EM | 0.941 | N/A\n", + "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.172 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.283 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - loss | 0.609 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:21:24,929 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:21:29,084 - INFO - combo.training.trainer - Epoch duration: 0:01:09.488866\n", + "2023-04-07 01:21:29,085 - INFO - combo.training.trainer - Estimated training time remaining: 5:04:54\n", + "2023-04-07 01:21:29,085 - INFO - allennlp.training.trainer - Epoch 133/399\n", + "2023-04-07 01:21:29,085 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:21:29,086 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:21:29,093 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9399, LAS: 0.9028, UEM: 0.2065, LEM: 0.0769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5936, partial_loss/deprel_loss: 0.5406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7503, loss: 0.7376, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||: 3%|3 | 3/95 [00:02<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9539, LAS: 0.9176, UEM: 0.5125, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2040, partial_loss/deprel_loss: 0.3429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5142, loss: 0.6439, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||: 7%|7 | 7/95 [00:04<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9564, LAS: 0.9197, UEM: 0.5869, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1730, partial_loss/deprel_loss: 0.2958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4703, loss: 0.6288, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||: 11%|# | 10/95 [00:06<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9559, LAS: 0.9192, UEM: 0.5592, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3661, partial_loss/deprel_loss: 0.4280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.6349, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||: 15%|#4 | 14/95 [00:09<00:54, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9564, LAS: 0.9201, UEM: 0.5590, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5096, partial_loss/deprel_loss: 0.4017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6224, loss: 0.6229, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||: 18%|#7 | 17/95 [00:11<00:52, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9589, LAS: 0.9226, UEM: 0.5985, LEM: 0.3627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.2514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4407, loss: 0.6044, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||: 22%|##2 | 21/95 [00:13<00:47, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9576, LAS: 0.9207, UEM: 0.6014, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3723, partial_loss/deprel_loss: 0.4805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6579, loss: 0.6190, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||: 25%|##5 | 24/95 [00:15<00:46, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9574, LAS: 0.9211, UEM: 0.5883, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3182, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5365, loss: 0.6163, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||: 28%|##8 | 27/95 [00:17<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9577, LAS: 0.9216, UEM: 0.5975, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1524, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4785, loss: 0.6115, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||: 33%|###2 | 31/95 [00:20<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9586, LAS: 0.9224, UEM: 0.6095, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.2543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.6066, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||: 36%|###5 | 34/95 [00:22<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9574, LAS: 0.9210, UEM: 0.5948, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6901, partial_loss/deprel_loss: 0.5410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7698, loss: 0.6148, batch_reg_loss: 0.1990, reg_loss: 0.1990 ||: 39%|###8 | 37/95 [00:25<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9583, LAS: 0.9223, UEM: 0.6306, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3606, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5224, loss: 0.6058, batch_reg_loss: 0.1990, reg_loss: 0.1990 ||: 42%|####2 | 40/95 [00:27<00:41, 1.34it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9590, LAS: 0.9227, UEM: 0.6295, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3459, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6169, loss: 0.6030, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 46%|####6 | 44/95 [00:30<00:36, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9228, UEM: 0.6317, LEM: 0.4045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.6015, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 49%|####9 | 47/95 [00:32<00:33, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9593, LAS: 0.9229, UEM: 0.6357, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6555, partial_loss/deprel_loss: 0.5572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7758, loss: 0.6008, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 53%|#####2 | 50/95 [00:34<00:32, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9585, LAS: 0.9220, UEM: 0.6241, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6961, partial_loss/deprel_loss: 0.5424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.6065, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 56%|#####5 | 53/95 [00:36<00:31, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9579, LAS: 0.9214, UEM: 0.6182, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.8112, partial_loss/deprel_loss: 0.5747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8209, loss: 0.6116, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 59%|#####8 | 56/95 [00:39<00:29, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9569, LAS: 0.9204, UEM: 0.6100, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6640, loss: 0.6181, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 62%|######2 | 59/95 [00:41<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9569, LAS: 0.9203, UEM: 0.6064, LEM: 0.3807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6156, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7598, loss: 0.6195, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 65%|######5 | 62/95 [00:43<00:25, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9579, LAS: 0.9213, UEM: 0.6329, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0794, partial_loss/deprel_loss: 0.1908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3673, loss: 0.6108, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 68%|######8 | 65/95 [00:46<00:23, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9577, LAS: 0.9212, UEM: 0.6300, LEM: 0.4073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3188, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5700, loss: 0.6126, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 72%|#######1 | 68/95 [00:48<00:21, 1.28it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9580, LAS: 0.9214, UEM: 0.6344, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4566, partial_loss/deprel_loss: 0.4366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.6101, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||: 75%|#######4 | 71/95 [00:50<00:17, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9579, LAS: 0.9212, UEM: 0.6278, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2838, partial_loss/deprel_loss: 0.3759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.6125, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||: 79%|#######8 | 75/95 [00:53<00:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9580, LAS: 0.9211, UEM: 0.6389, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0798, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4073, loss: 0.6137, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||: 82%|########2 | 78/95 [00:55<00:12, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9574, LAS: 0.9206, UEM: 0.6413, LEM: 0.4196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9004, partial_loss/deprel_loss: 0.6443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8944, loss: 0.6174, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||: 85%|########5 | 81/95 [00:57<00:10, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9580, LAS: 0.9210, UEM: 0.6499, LEM: 0.4262, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5478, loss: 0.6142, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||: 89%|########9 | 85/95 [00:59<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9586, LAS: 0.9217, UEM: 0.6566, LEM: 0.4312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1234, partial_loss/deprel_loss: 0.2830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.6101, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||: 94%|#########3| 89/95 [01:02<00:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9588, LAS: 0.9217, UEM: 0.6545, LEM: 0.4263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2995, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5546, loss: 0.6094, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||: 98%|#########7| 93/95 [01:05<00:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9591, LAS: 0.9221, UEM: 0.6580, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.6070, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - reg_loss | 0.199 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - UEM | 0.658 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - LEM | 0.429 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EM | 0.934 | N/A\n", + "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.268 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.330 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - loss | 0.607 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,764 - INFO - allennlp.training.checkpointer - Best 
validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:22:45,622 - INFO - combo.training.trainer - Epoch duration: 0:01:16.537262\n", + "2023-04-07 01:22:45,623 - INFO - combo.training.trainer - Estimated training time remaining: 5:04:01\n", + "2023-04-07 01:22:45,623 - INFO - allennlp.training.trainer - Epoch 134/399\n", + "2023-04-07 01:22:45,623 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:22:45,624 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:22:45,633 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9587, LAS: 0.9216, UEM: 0.5794, LEM: 0.3084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.6184, batch_reg_loss: 0.1988, reg_loss: 0.1988 ||: 4%|4 | 4/95 [00:02<00:55, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9627, LAS: 0.9254, UEM: 0.6145, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3075, partial_loss/deprel_loss: 0.3267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.5816, batch_reg_loss: 0.1987, reg_loss: 0.1988 ||: 7%|7 | 7/95 [00:04<00:55, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9634, LAS: 0.9266, UEM: 0.6209, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.5769, batch_reg_loss: 0.1987, reg_loss: 0.1988 ||: 12%|#1 | 11/95 [00:06<00:52, 1.60it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9658, LAS: 0.9284, UEM: 0.6867, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0975, partial_loss/deprel_loss: 0.2502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4184, loss: 0.5614, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||: 16%|#5 | 15/95 [00:09<00:52, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9657, LAS: 0.9285, UEM: 0.6866, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.3317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5615, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||: 20%|## | 19/95 [00:12<00:48, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9659, LAS: 0.9286, UEM: 0.6879, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4217, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.5634, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||: 23%|##3 | 22/95 [00:14<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9638, LAS: 0.9263, UEM: 0.6769, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3697, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.5777, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 26%|##6 | 25/95 [00:16<00:47, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9532, UAS: 0.9637, LAS: 0.9269, UEM: 0.6751, LEM: 0.4226, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1453, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4296, loss: 0.5786, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 29%|##9 | 28/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9634, LAS: 0.9266, UEM: 0.6617, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5527, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7243, loss: 0.5815, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 34%|###3 | 32/95 [00:21<00:42, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9643, LAS: 0.9273, UEM: 0.6860, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1710, partial_loss/deprel_loss: 0.2952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4690, loss: 0.5732, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 37%|###6 | 35/95 [00:23<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9637, LAS: 0.9265, UEM: 0.6841, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7499, partial_loss/deprel_loss: 0.6065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8338, loss: 0.5772, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 40%|#### | 38/95 [00:25<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9640, LAS: 0.9269, UEM: 0.6920, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5653, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7277, loss: 0.5742, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 43%|####3 | 41/95 
[00:28<00:41, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9645, LAS: 0.9272, UEM: 0.6925, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2804, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.5728, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||: 46%|####6 | 44/95 [00:30<00:38, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9633, LAS: 0.9257, UEM: 0.6906, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3622, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6005, loss: 0.5807, batch_reg_loss: 0.1985, reg_loss: 0.1987 ||: 49%|####9 | 47/95 [00:32<00:36, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9372, UAS: 0.9629, LAS: 0.9254, UEM: 0.6836, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2095, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5069, loss: 0.5827, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||: 54%|#####3 | 51/95 [00:35<00:32, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9625, LAS: 0.9251, UEM: 0.6921, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2024, partial_loss/deprel_loss: 0.3444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.5865, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||: 58%|#####7 | 55/95 [00:38<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9626, LAS: 0.9250, UEM: 0.6952, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.2485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4214, loss: 0.5862, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||: 61%|######1 | 58/95 [00:40<00:27, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9629, LAS: 0.9255, UEM: 0.6956, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3908, partial_loss/deprel_loss: 0.4097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.5823, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||: 65%|######5 | 62/95 [00:43<00:23, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9629, LAS: 0.9255, UEM: 0.6915, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3678, partial_loss/deprel_loss: 0.4048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5824, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||: 68%|######8 | 65/95 [00:45<00:22, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9628, LAS: 0.9254, UEM: 0.6897, LEM: 0.4478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1705, partial_loss/deprel_loss: 0.2590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.5825, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 72%|#######1 | 68/95 [00:48<00:20, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9617, LAS: 0.9244, UEM: 0.6812, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8721, partial_loss/deprel_loss: 0.5912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8458, loss: 0.5900, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 75%|#######4 | 71/95 [00:50<00:17, 
1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9611, LAS: 0.9238, UEM: 0.6721, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7259, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 0.5945, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 78%|#######7 | 74/95 [00:52<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9605, LAS: 0.9232, UEM: 0.6652, LEM: 0.4278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.5349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7612, loss: 0.5999, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 81%|########1 | 77/95 [00:54<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9597, LAS: 0.9227, UEM: 0.6757, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4574, partial_loss/deprel_loss: 0.7380, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0803, loss: 0.6039, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 84%|########4 | 80/95 [00:56<00:11, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9594, LAS: 0.9223, UEM: 0.6720, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 0.6069, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 87%|########7 | 83/95 [00:59<00:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9592, LAS: 0.9219, UEM: 0.6638, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7097, loss: 0.6094, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 92%|#########1| 87/95 [01:01<00:05, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9592, LAS: 0.9218, UEM: 0.6602, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2254, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4847, loss: 0.6093, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 96%|#########5| 91/95 [01:03<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9596, LAS: 0.9221, UEM: 0.6595, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5255, loss: 0.6066, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 100%|##########| 95/95 [01:06<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9596, LAS: 0.9221, UEM: 0.6595, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5255, loss: 0.6066, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - reg_loss | 0.199 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UEM | 0.660 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - LEM | 0.427 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - EM | 0.934 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.216 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.355 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - loss | 0.607 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:23:55,494 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:24:00,913 - INFO - combo.training.trainer - Epoch duration: 0:01:15.289828\n", + "2023-04-07 01:24:00,913 - INFO - combo.training.trainer - Estimated training time remaining: 5:03:06\n", + "2023-04-07 01:24:00,913 - INFO - allennlp.training.trainer - Epoch 135/399\n", + "2023-04-07 01:24:00,913 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:24:00,914 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:24:00,924 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9734, LAS: 0.9385, UEM: 0.8424, LEM: 0.6630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5135, partial_loss/deprel_loss: 0.5183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7157, loss: 0.4844, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||: 4%|4 | 4/95 [00:02<00:47, 1.92it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9621, LAS: 0.9262, UEM: 0.7501, LEM: 0.5557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5013, loss: 0.5787, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||: 9%|9 | 9/95 [00:04<00:43, 1.99it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9640, LAS: 0.9268, UEM: 0.7403, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3602, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.5684, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||: 15%|#4 | 14/95 
[00:06<00:39, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9642, LAS: 0.9273, UEM: 0.7454, LEM: 0.5255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8161, partial_loss/deprel_loss: 0.5156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7740, loss: 0.5649, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||: 19%|#8 | 18/95 [00:08<00:39, 1.94it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9608, LAS: 0.9236, UEM: 0.7243, LEM: 0.5029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.3806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.5923, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||: 23%|##3 | 22/95 [00:11<00:41, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9598, LAS: 0.9227, UEM: 0.7079, LEM: 0.4870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7618, partial_loss/deprel_loss: 0.5350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7786, loss: 0.5970, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||: 27%|##7 | 26/95 [00:14<00:40, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9609, LAS: 0.9239, UEM: 0.7030, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2092, partial_loss/deprel_loss: 0.3251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5888, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||: 32%|###1 | 30/95 [00:17<00:40, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9599, LAS: 0.9229, UEM: 0.6832, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6985, partial_loss/deprel_loss: 0.5348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7658, loss: 0.5973, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||: 36%|###5 | 34/95 [00:19<00:37, 1.65it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9603, LAS: 0.9235, UEM: 0.6796, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3702, partial_loss/deprel_loss: 0.3774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5742, loss: 0.5939, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||: 40%|#### | 38/95 [00:21<00:34, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9588, LAS: 0.9218, UEM: 0.6668, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.6046, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 44%|####4 | 42/95 [00:24<00:32, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9588, LAS: 0.9219, UEM: 0.6636, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0991, partial_loss/deprel_loss: 0.2442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.6069, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 48%|####8 | 46/95 [00:26<00:30, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9595, LAS: 0.9228, UEM: 0.6722, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1898, partial_loss/deprel_loss: 0.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.6017, batch_reg_loss: 0.1982, 
reg_loss: 0.1983 ||: 53%|#####2 | 50/95 [00:30<00:30, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9598, LAS: 0.9230, UEM: 0.6752, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1546, partial_loss/deprel_loss: 0.2717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4465, loss: 0.6022, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 56%|#####5 | 53/95 [00:32<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9602, LAS: 0.9234, UEM: 0.6769, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4765, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.6002, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9599, LAS: 0.9233, UEM: 0.6675, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6918, loss: 0.6008, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 63%|######3 | 60/95 [00:36<00:23, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9588, LAS: 0.9221, UEM: 0.6554, LEM: 0.4282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6334, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7264, loss: 0.6090, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 67%|######7 | 64/95 [00:39<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9593, LAS: 0.9229, UEM: 0.6709, LEM: 0.4527, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5367, partial_loss/deprel_loss: 0.4702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.6044, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 71%|####### | 67/95 [00:42<00:20, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9592, LAS: 0.9228, UEM: 0.6741, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.5313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7579, loss: 0.6047, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 74%|#######3 | 70/95 [00:44<00:19, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9593, LAS: 0.9228, UEM: 0.6713, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.6042, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 77%|#######6 | 73/95 [00:46<00:16, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9588, LAS: 0.9222, UEM: 0.6636, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5401, loss: 0.6087, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||: 81%|########1 | 77/95 [00:49<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9591, LAS: 0.9224, UEM: 0.6621, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5417, loss: 0.6078, batch_reg_loss: 0.1981, reg_loss: 
0.1983 ||: 84%|########4 | 80/95 [00:51<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9592, LAS: 0.9225, UEM: 0.6615, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4661, partial_loss/deprel_loss: 0.4844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6789, loss: 0.6062, batch_reg_loss: 0.1981, reg_loss: 0.1983 ||: 87%|########7 | 83/95 [00:53<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9591, LAS: 0.9224, UEM: 0.6554, LEM: 0.4328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3490, partial_loss/deprel_loss: 0.4178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.6071, batch_reg_loss: 0.1981, reg_loss: 0.1983 ||: 92%|#########1| 87/95 [00:55<00:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9593, LAS: 0.9226, UEM: 0.6519, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4279, partial_loss/deprel_loss: 0.4535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.6058, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||: 96%|#########5| 91/95 [00:58<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9596, LAS: 0.9228, UEM: 0.6544, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3878, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6518, loss: 0.6035, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||: 99%|#########8| 94/95 [01:00<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9596, LAS: 0.9229, UEM: 0.6572, LEM: 
0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.2692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4540, loss: 0.6019, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 01:25:05,849 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9448, LAS: 0.8910, UEM: 0.5697, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5015, partial_loss/deprel_loss: 20.5917, partial_loss/cycle_loss: 0.0000, batch_loss: 16.7736, loss: 10.3735, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:03<00:08, 1.06s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9466, LAS: 0.8907, UEM: 0.5723, LEM: 0.2552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6183, partial_loss/deprel_loss: 7.5705, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1801, loss: 9.4382, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:05, 1.01s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9465, LAS: 0.8924, UEM: 0.5659, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9658, partial_loss/deprel_loss: 9.7527, partial_loss/cycle_loss: 0.0000, batch_loss: 7.9953, loss: 9.4572, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9518, LAS: 0.9006, UEM: 0.6898, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 5.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1963, loss: 8.5575, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9518, LAS: 0.9006, UEM: 0.6898, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 5.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1963, loss: 8.5575, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01it/s]\n", + "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer - reg_loss | 0.198 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UEM | 0.657 | 0.690\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LEM | 0.433 | 0.415\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EM | 0.933 | 0.944\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.203 | 0.208\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | 0.952\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.269 | 5.193\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - loss | 0.602 | 8.557\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LAS | 0.923 | 0.901\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:25:16,785 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:25:16,785 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:25:16,789 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:25:21,507 - INFO - combo.training.trainer - Epoch duration: 0:01:20.593771\n", + "2023-04-07 01:25:21,508 - INFO - combo.training.trainer - Estimated training time remaining: 5:02:20\n", + "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - Epoch 136/399\n", + "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:25:21,519 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9477, LAS: 0.9105, UEM: 0.4170, LEM: 0.1993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.3794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.6688, batch_reg_loss: 0.1981, reg_loss: 0.1981 ||: 5%|5 | 5/95 [00:02<00:41, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9572, LAS: 0.9211, UEM: 0.6111, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6145, partial_loss/deprel_loss: 0.5036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7239, loss: 0.6007, batch_reg_loss: 0.1981, reg_loss: 0.1981 ||: 11%|# | 10/95 [00:04<00:39, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9574, LAS: 0.9199, UEM: 0.6279, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2094, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5212, loss: 0.6057, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||: 16%|#5 | 15/95 [00:06<00:36, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9589, LAS: 0.9215, UEM: 0.6452, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6473, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.5946, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||: 19%|#8 | 18/95 [00:09<00:42, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9589, LAS: 0.9216, UEM: 0.6381, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5630, partial_loss/deprel_loss: 0.4474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6685, loss: 0.5919, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||: 23%|##3 | 22/95 [00:11<00:42, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9592, LAS: 0.9222, UEM: 0.6422, LEM: 0.3934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.3576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5916, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||: 26%|##6 | 25/95 [00:14<00:44, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9570, LAS: 0.9201, UEM: 0.6178, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4075, partial_loss/deprel_loss: 0.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.6105, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||: 31%|### | 29/95 [00:16<00:41, 1.58it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9571, LAS: 0.9201, UEM: 0.6056, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.5901, partial_loss/deprel_loss: 0.4912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.6146, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||: 34%|###3 | 32/95 [00:18<00:41, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9567, LAS: 0.9198, UEM: 0.6082, LEM: 0.3685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8884, partial_loss/deprel_loss: 0.6101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8637, loss: 0.6163, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||: 37%|###6 | 35/95 [00:20<00:40, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9573, LAS: 0.9206, UEM: 0.6068, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3104, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5596, loss: 0.6127, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||: 40%|#### | 38/95 [00:23<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9560, UAS: 0.9582, LAS: 0.9216, UEM: 0.6191, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0835, partial_loss/deprel_loss: 0.2134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.6083, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 44%|####4 | 42/95 [00:26<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9590, LAS: 0.9223, UEM: 0.6321, LEM: 0.3934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4743, loss: 0.6025, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 47%|####7 | 45/95 [00:28<00:35, 1.39it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9560, LAS: 0.9194, UEM: 0.6176, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3761, partial_loss/deprel_loss: 0.7035, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.6228, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 52%|#####1 | 49/95 [00:31<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9568, LAS: 0.9201, UEM: 0.6234, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.6176, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 55%|#####4 | 52/95 [00:33<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8834, UAS: 0.9570, LAS: 0.9205, UEM: 0.6418, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8543, partial_loss/deprel_loss: 0.6344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.6145, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 58%|#####7 | 55/95 [00:35<00:28, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9579, LAS: 0.9214, UEM: 0.6563, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5273, loss: 0.6074, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 61%|######1 | 58/95 [00:37<00:27, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9582, LAS: 0.9217, UEM: 0.6544, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4923, partial_loss/deprel_loss: 0.4504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6567, loss: 0.6058, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 64%|######4 | 61/95 [00:39<00:24, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9589, LAS: 0.9225, UEM: 0.6632, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 0.2583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.6002, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 67%|######7 | 64/95 [00:42<00:23, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9581, LAS: 0.9217, UEM: 0.6515, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7897, partial_loss/deprel_loss: 0.5498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.6060, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 72%|#######1 | 68/95 [00:44<00:19, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9582, LAS: 0.9218, UEM: 0.6451, LEM: 0.4123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3828, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.6069, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||: 76%|#######5 | 72/95 [00:47<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9585, LAS: 0.9220, UEM: 0.6490, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.3631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.6041, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||: 79%|#######8 | 75/95 [00:49<00:14, 
1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9586, LAS: 0.9220, UEM: 0.6448, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1703, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5059, loss: 0.6055, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||: 83%|########3 | 79/95 [00:52<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9589, LAS: 0.9223, UEM: 0.6472, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 0.4348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6431, loss: 0.6029, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||: 86%|########6 | 82/95 [00:54<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9589, LAS: 0.9222, UEM: 0.6438, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.6042, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 91%|######### | 86/95 [00:57<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9588, LAS: 0.9222, UEM: 0.6445, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4299, partial_loss/deprel_loss: 0.4909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6765, loss: 0.6043, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 94%|#########3| 89/95 [00:59<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9588, LAS: 0.9221, UEM: 0.6399, LEM: 0.4076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5266, partial_loss/deprel_loss: 0.4846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6908, loss: 0.6058, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 97%|#########6| 92/95 [01:03<00:02, 1.13it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9595, LAS: 0.9230, UEM: 0.6589, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1738, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6001, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:05<00:00, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9595, LAS: 0.9230, UEM: 0.6589, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1738, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6001, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - reg_loss | 0.198 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - UEM | 0.659 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - LEM | 0.431 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EM | 0.939 | N/A\n", + "2023-04-07 01:26:29,688 
- INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.174 | N/A\n", + "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.328 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - loss | 0.600 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - LAS | 0.923 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:29,694 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:26:33,709 - INFO - combo.training.trainer - Epoch duration: 0:01:12.201244\n", + "2023-04-07 01:26:33,709 - INFO - combo.training.trainer - Estimated training time remaining: 5:01:18\n", + "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - Epoch 137/399\n", + "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:26:33,718 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9578, LAS: 0.9179, UEM: 0.6403, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8409, partial_loss/deprel_loss: 0.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8582, loss: 0.6337, batch_reg_loss: 0.1978, reg_loss: 0.1978 ||: 4%|4 | 4/95 [00:02<00:56, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9617, LAS: 0.9243, UEM: 0.6554, LEM: 0.3759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2772, partial_loss/deprel_loss: 0.3896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.5891, batch_reg_loss: 0.1977, reg_loss: 0.1978 ||: 8%|8 | 8/95 [00:04<00:54, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9616, LAS: 0.9247, UEM: 0.6517, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.3472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.5920, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||: 13%|#2 | 12/95 [00:07<00:52, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9630, LAS: 0.9263, UEM: 0.6644, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4985, partial_loss/deprel_loss: 0.5145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.5823, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||: 17%|#6 | 16/95 [00:09<00:47, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9618, LAS: 0.9251, UEM: 0.6491, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5085, loss: 0.5885, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||: 22%|##2 | 21/95 [00:11<00:40, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9616, LAS: 0.9249, UEM: 0.6594, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1471, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.5903, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||: 27%|##7 | 26/95 [00:14<00:37, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9591, LAS: 0.9221, UEM: 0.6384, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2336, partial_loss/deprel_loss: 0.7373, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0342, loss: 0.6098, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 33%|###2 | 31/95 [00:17<00:34, 1.88it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9612, LAS: 0.9247, UEM: 0.6996, LEM: 0.4798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1872, partial_loss/deprel_loss: 0.3673, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5289, loss: 0.5921, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 37%|###6 | 35/95 [00:20<00:37, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9609, LAS: 0.9246, UEM: 0.6880, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4530, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6143, loss: 0.5916, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 41%|####1 | 39/95 [00:23<00:36, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9601, LAS: 0.9238, UEM: 0.6744, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8377, partial_loss/deprel_loss: 0.5340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.5982, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 45%|####5 | 43/95 [00:25<00:32, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9594, LAS: 0.9230, UEM: 0.6606, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5927, loss: 0.6032, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 49%|####9 | 47/95 [00:28<00:30, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9600, LAS: 0.9236, UEM: 0.6667, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3820, partial_loss/deprel_loss: 0.4031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5984, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 54%|#####3 | 51/95 [00:30<00:28, 1.53it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9589, LAS: 0.9223, UEM: 0.6633, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2752, partial_loss/deprel_loss: 0.3877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5628, loss: 0.6049, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||: 58%|#####7 | 55/95 [00:33<00:25, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9590, LAS: 0.9223, UEM: 0.6597, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.6049, batch_reg_loss: 0.1976, reg_loss: 0.1976 ||: 62%|######2 | 59/95 [00:35<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9592, LAS: 0.9223, UEM: 0.6543, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5126, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6555, loss: 0.6051, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 66%|######6 | 63/95 [00:38<00:21, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9601, LAS: 0.9233, UEM: 0.6704, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 0.3038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.5972, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 71%|####### | 67/95 [00:41<00:18, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9599, LAS: 0.9231, UEM: 0.6695, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1581, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4612, loss: 0.5972, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 75%|#######4 | 71/95 [00:44<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9598, LAS: 0.9232, UEM: 0.6675, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5374, loss: 0.5974, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 79%|#######8 | 75/95 [00:46<00:13, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9603, LAS: 0.9235, UEM: 0.6675, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5380, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6997, loss: 0.5962, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 83%|########3 | 79/95 [00:49<00:10, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9597, LAS: 0.9228, UEM: 0.6618, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0778, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9054, loss: 0.6002, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 87%|########7 | 83/95 [00:52<00:08, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9596, LAS: 0.9226, UEM: 0.6607, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7499, loss: 0.6014, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||: 91%|######### | 86/95 [00:54<00:06, 
1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9594, LAS: 0.9224, UEM: 0.6574, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6314, partial_loss/deprel_loss: 0.5472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7615, loss: 0.6034, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 94%|#########3| 89/95 [00:56<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9598, LAS: 0.9227, UEM: 0.6653, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.6003, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 97%|#########6| 92/95 [00:59<00:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9228, UEM: 0.6633, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.5997, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 100%|##########| 95/95 [01:01<00:00, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9228, UEM: 0.6633, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.5997, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + 
"2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - reg_loss | 0.198 | N/A\n", + "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UEM | 0.663 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LEM | 0.432 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - EM | 0.928 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.321 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.440 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - loss | 0.600 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LAS | 0.923 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
N/A\n", + "2023-04-07 01:27:38,164 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:27:38,168 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:27:42,897 - INFO - combo.training.trainer - Epoch duration: 0:01:09.187591\n", + "2023-04-07 01:27:42,898 - INFO - combo.training.trainer - Estimated training time remaining: 5:00:10\n", + "2023-04-07 01:27:42,898 - INFO - allennlp.training.trainer - Epoch 138/399\n", + "2023-04-07 01:27:42,898 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:27:42,899 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:27:42,907 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9656, LAS: 0.9287, UEM: 0.6550, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2006, partial_loss/deprel_loss: 0.3173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4914, loss: 0.5460, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 3%|3 | 3/95 [00:02<01:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9685, LAS: 0.9327, UEM: 0.6778, LEM: 0.4097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.5286, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 6%|6 | 6/95 [00:04<01:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9696, UAS: 0.9720, LAS: 0.9371, UEM: 0.7967, LEM: 0.5964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.0302, partial_loss/deprel_loss: 0.1199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2994, loss: 0.4928, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 8%|8 | 8/95 [00:06<01:10, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9672, LAS: 0.9314, UEM: 0.7446, LEM: 0.5393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3475, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.5362, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 12%|#1 | 11/95 [00:08<01:05, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9339, UAS: 0.9653, LAS: 0.9291, UEM: 0.7202, LEM: 0.5100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1821, partial_loss/deprel_loss: 0.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4743, loss: 0.5506, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 15%|#4 | 14/95 [00:10<01:01, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9605, LAS: 0.9237, UEM: 0.6877, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5680, partial_loss/deprel_loss: 0.4767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6923, loss: 0.5843, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||: 18%|#7 | 17/95 [00:12<00:58, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9619, LAS: 0.9251, UEM: 0.6909, LEM: 0.4720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.3693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.5734, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9632, LAS: 0.9268, UEM: 0.7058, LEM: 0.4823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1060, partial_loss/deprel_loss: 0.2545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4221, loss: 0.5637, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||: 24%|##4 | 23/95 [00:16<00:51, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9624, LAS: 0.9259, UEM: 0.6856, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7878, partial_loss/deprel_loss: 0.4806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7394, loss: 0.5732, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||: 28%|##8 | 27/95 [00:19<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9623, LAS: 0.9256, UEM: 0.6836, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7151, partial_loss/deprel_loss: 0.5253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7605, loss: 0.5748, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||: 33%|###2 | 31/95 [00:21<00:40, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9614, LAS: 0.9245, UEM: 0.6895, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1021, partial_loss/deprel_loss: 0.2748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4375, loss: 0.5830, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||: 37%|###6 | 35/95 [00:23<00:36, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9606, LAS: 0.9239, UEM: 0.6718, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, 
partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6038, loss: 0.5886, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||: 41%|####1 | 39/95 [00:26<00:33, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9616, LAS: 0.9249, UEM: 0.6908, LEM: 0.4621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0725, partial_loss/deprel_loss: 0.1679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3460, loss: 0.5810, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||: 45%|####5 | 43/95 [00:28<00:33, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9618, LAS: 0.9249, UEM: 0.7016, LEM: 0.4716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1319, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5773, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||: 49%|####9 | 47/95 [00:31<00:30, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9609, LAS: 0.9244, UEM: 0.6875, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3932, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6016, loss: 0.5833, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 54%|#####3 | 51/95 [00:33<00:27, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9611, LAS: 0.9247, UEM: 0.6906, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1672, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4715, loss: 0.5804, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 58%|#####7 | 55/95 [00:35<00:23, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9598, LAS: 0.9234, UEM: 0.6782, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6884, partial_loss/deprel_loss: 0.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7135, loss: 0.5895, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 63%|######3 | 60/95 [00:38<00:19, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9594, LAS: 0.9229, UEM: 0.6681, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5827, loss: 0.5960, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 68%|######8 | 65/95 [00:40<00:15, 1.93it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9601, LAS: 0.9236, UEM: 0.6772, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2404, partial_loss/deprel_loss: 0.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.5907, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 73%|#######2 | 69/95 [00:43<00:16, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9607, LAS: 0.9241, UEM: 0.6831, LEM: 0.4510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1677, partial_loss/deprel_loss: 0.2805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4551, loss: 0.5868, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||: 77%|#######6 | 73/95 [00:46<00:14, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9604, LAS: 0.9236, UEM: 0.6764, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5734, partial_loss/deprel_loss: 0.4774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6938, loss: 0.5904, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||: 81%|########1 | 77/95 [00:49<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9603, LAS: 0.9236, UEM: 0.6720, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5311, partial_loss/deprel_loss: 0.5182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.5907, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||: 85%|########5 | 81/95 [00:52<00:09, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9596, LAS: 0.9229, UEM: 0.6633, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4483, partial_loss/deprel_loss: 0.4611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6557, loss: 0.5969, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||: 89%|########9 | 85/95 [00:55<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9596, LAS: 0.9229, UEM: 0.6591, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.3435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5223, loss: 0.5968, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||: 94%|#########3| 89/95 [00:57<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9599, LAS: 0.9233, UEM: 0.6637, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.5939, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||: 
97%|#########6| 92/95 [01:00<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9600, LAS: 0.9233, UEM: 0.6597, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5936, batch_reg_loss: 0.1971, reg_loss: 0.1972 ||: 100%|##########| 95/95 [01:02<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9600, LAS: 0.9233, UEM: 0.6597, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5936, batch_reg_loss: 0.1971, reg_loss: 0.1972 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer - reg_loss | 0.197 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UEM | 0.660 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LEM | 0.426 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.286 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - 
partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.337 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - loss | 0.594 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LAS | 0.923 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:28:48,308 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:28:53,247 - INFO - combo.training.trainer - Epoch duration: 0:01:10.348896\n", + "2023-04-07 01:28:53,248 - INFO - combo.training.trainer - Estimated training time remaining: 4:59:05\n", + "2023-04-07 01:28:53,248 - INFO - allennlp.training.trainer - Epoch 139/399\n", + "2023-04-07 01:28:53,248 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:28:53,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:28:53,260 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9606, LAS: 0.9218, UEM: 0.6580, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1156, partial_loss/deprel_loss: 0.2599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.5922, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||: 4%|4 | 4/95 [00:02<01:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9517, LAS: 0.9137, UEM: 0.6397, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.2646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4591, loss: 0.6459, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||: 7%|7 | 7/95 [00:04<01:01, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9240, UAS: 0.9535, LAS: 0.9163, UEM: 0.6238, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3397, partial_loss/deprel_loss: 0.3835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.6356, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||: 11%|# | 10/95 
[00:07<01:03, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9587, LAS: 0.9227, UEM: 0.6995, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1266, partial_loss/deprel_loss: 0.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4367, loss: 0.5918, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||: 14%|#3 | 13/95 [00:10<01:02, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9599, LAS: 0.9239, UEM: 0.6762, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.4457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.5941, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||: 18%|#7 | 17/95 [00:12<00:55, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9584, LAS: 0.9223, UEM: 0.6474, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8026, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7622, loss: 0.6050, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||: 22%|##2 | 21/95 [00:14<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9586, LAS: 0.9222, UEM: 0.6493, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.6059, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 25%|##5 | 24/95 [00:17<00:50, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9588, LAS: 0.9221, UEM: 0.6425, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4044, partial_loss/deprel_loss: 0.3984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5966, loss: 0.6044, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 29%|##9 | 28/95 [00:19<00:45, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9609, LAS: 0.9247, UEM: 0.6930, LEM: 0.4803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2666, partial_loss/deprel_loss: 0.3292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.5868, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 33%|###2 | 31/95 [00:22<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9604, LAS: 0.9243, UEM: 0.6867, LEM: 0.4756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6902, partial_loss/deprel_loss: 0.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6989, loss: 0.5879, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 36%|###5 | 34/95 [00:24<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9604, LAS: 0.9243, UEM: 0.6827, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1529, partial_loss/deprel_loss: 0.2892, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4589, loss: 0.5894, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 40%|#### | 38/95 [00:27<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9598, LAS: 0.9235, UEM: 0.6741, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3820, partial_loss/deprel_loss: 0.4045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5970, loss: 0.5943, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||: 44%|####4 | 42/95 [00:29<00:36, 1.46it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9596, LAS: 0.9232, UEM: 0.6796, LEM: 0.4645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1011, partial_loss/deprel_loss: 0.2468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5964, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 47%|####7 | 45/95 [00:32<00:36, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9592, LAS: 0.9226, UEM: 0.6667, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.6007, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 52%|#####1 | 49/95 [00:34<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9585, LAS: 0.9219, UEM: 0.6564, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4568, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7370, loss: 0.6071, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9590, LAS: 0.9223, UEM: 0.6594, LEM: 0.4388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.3183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.6044, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 58%|#####7 | 55/95 [00:38<00:28, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9227, UEM: 0.6548, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4273, partial_loss/deprel_loss: 0.3596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.6018, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 62%|######2 | 59/95 [00:41<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9588, LAS: 0.9220, UEM: 0.6436, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7359, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7569, loss: 0.6058, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 66%|######6 | 63/95 [00:43<00:21, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9595, LAS: 0.9227, UEM: 0.6474, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5647, partial_loss/deprel_loss: 0.4988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7089, loss: 0.6011, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 72%|#######1 | 68/95 [00:46<00:16, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9599, LAS: 0.9232, UEM: 0.6477, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3547, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.5981, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 77%|#######6 | 73/95 [00:48<00:12, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9603, LAS: 0.9237, UEM: 0.6488, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.5955, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||: 82%|########2 | 78/95 [00:50<00:08, 1.91it/s]\n" + ] + }, + { + "name": 
"stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9602, LAS: 0.9235, UEM: 0.6453, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6260, partial_loss/deprel_loss: 0.5170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7357, loss: 0.5959, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||: 86%|########6 | 82/95 [00:52<00:06, 1.93it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9609, LAS: 0.9244, UEM: 0.6631, LEM: 0.4377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0888, partial_loss/deprel_loss: 0.1850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3626, loss: 0.5888, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||: 91%|######### | 86/95 [00:55<00:05, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9613, LAS: 0.9247, UEM: 0.6672, LEM: 0.4403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5356, loss: 0.5864, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||: 95%|#########4| 90/95 [00:58<00:02, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9607, LAS: 0.9241, UEM: 0.6642, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2155, partial_loss/deprel_loss: 0.2877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.5906, batch_reg_loss: 0.1968, reg_loss: 0.1969 ||: 99%|#########8| 94/95 [01:01<00:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9608, LAS: 0.9244, UEM: 0.6660, LEM: 0.4396, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.2655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5890, batch_reg_loss: 0.1968, reg_loss: 0.1969 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 01:29:58,402 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - reg_loss | 0.197 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UEM | 0.666 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - LEM | 0.440 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EM | 0.947 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.172 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.266 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - loss | 0.589 | N/A\n", + "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | N/A\n", + "2023-04-07 
01:29:58,404 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:58,408 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:30:02,573 - INFO - combo.training.trainer - Epoch duration: 0:01:09.325241\n", + "2023-04-07 01:30:02,574 - INFO - combo.training.trainer - Estimated training time remaining: 4:57:57\n", + "2023-04-07 01:30:02,574 - INFO - allennlp.training.trainer - Epoch 140/399\n", + "2023-04-07 01:30:02,574 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:30:02,575 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:30:02,584 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9549, LAS: 0.9209, UEM: 0.4025, LEM: 0.1541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6574, loss: 0.6231, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||: 3%|3 | 3/95 [00:02<01:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9597, LAS: 0.9261, UEM: 0.5462, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4982, loss: 0.5811, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||: 6%|6 | 6/95 [00:04<01:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9625, LAS: 0.9282, UEM: 0.6070, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6043, loss: 0.5652, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||: 9%|9 | 9/95 [00:06<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9641, LAS: 0.9287, UEM: 0.6138, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.3618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5469, loss: 0.5624, batch_reg_loss: 0.1967, reg_loss: 0.1968 ||: 14%|#3 | 13/95 [00:09<00:58, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9634, LAS: 0.9279, UEM: 0.5874, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3066, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.5709, batch_reg_loss: 0.1967, reg_loss: 0.1968 ||: 18%|#7 | 17/95 [00:11<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9626, LAS: 0.9273, UEM: 0.6171, LEM: 0.3748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4825, loss: 0.5762, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||: 22%|##2 | 21/95 [00:14<00:50, 1.48it/s]\n" + ] + }, + { + "name": "stdout", 
+ "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9621, LAS: 0.9271, UEM: 0.6139, LEM: 0.3754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5532, partial_loss/deprel_loss: 0.4882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6979, loss: 0.5798, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||: 26%|##6 | 25/95 [00:16<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9642, LAS: 0.9293, UEM: 0.6653, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1061, partial_loss/deprel_loss: 0.2268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3993, loss: 0.5612, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||: 31%|### | 29/95 [00:19<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9648, LAS: 0.9300, UEM: 0.6708, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1593, partial_loss/deprel_loss: 0.2767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.5571, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||: 34%|###3 | 32/95 [00:21<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9654, LAS: 0.9306, UEM: 0.6747, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3367, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5531, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 37%|###6 | 35/95 [00:23<00:40, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9647, LAS: 0.9300, UEM: 0.6875, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.0927, partial_loss/deprel_loss: 0.1957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3717, loss: 0.5578, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 40%|#### | 38/95 [00:25<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9653, LAS: 0.9305, UEM: 0.6997, LEM: 0.4698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1231, partial_loss/deprel_loss: 0.2722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4390, loss: 0.5533, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 43%|####3 | 41/95 [00:28<00:38, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9630, LAS: 0.9282, UEM: 0.6846, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.5681, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 46%|####6 | 44/95 [00:30<00:36, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9621, LAS: 0.9270, UEM: 0.6746, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4848, loss: 0.5769, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 51%|##### | 48/95 [00:33<00:33, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9622, LAS: 0.9273, UEM: 0.6796, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4518, partial_loss/deprel_loss: 0.4611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.5744, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 54%|#####3 | 51/95 [00:35<00:32, 
1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9606, LAS: 0.9253, UEM: 0.6697, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.5853, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 58%|#####7 | 55/95 [00:38<00:28, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9613, LAS: 0.9259, UEM: 0.6830, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1258, partial_loss/deprel_loss: 0.2682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.5806, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||: 61%|######1 | 58/95 [00:41<00:29, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9614, LAS: 0.9258, UEM: 0.6792, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.5810, batch_reg_loss: 0.1965, reg_loss: 0.1967 ||: 65%|######5 | 62/95 [00:43<00:23, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9615, LAS: 0.9259, UEM: 0.6776, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.3455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5802, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 69%|######9 | 66/95 [00:45<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9615, LAS: 0.9259, UEM: 0.6753, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6507, partial_loss/deprel_loss: 0.5641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7780, loss: 0.5807, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 73%|#######2 | 69/95 [00:48<00:18, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9606, LAS: 0.9247, UEM: 0.6655, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3926, partial_loss/deprel_loss: 0.4924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.5882, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 77%|#######6 | 73/95 [00:50<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9603, LAS: 0.9245, UEM: 0.6605, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5515, loss: 0.5893, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 80%|######## | 76/95 [00:52<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9606, LAS: 0.9246, UEM: 0.6631, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.5882, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 83%|########3 | 79/95 [00:54<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9603, LAS: 0.9243, UEM: 0.6587, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.5910, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 87%|########7 | 83/95 [00:57<00:08, 
1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9356, UAS: 0.9602, LAS: 0.9242, UEM: 0.6559, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5021, loss: 0.5927, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 93%|#########2| 88/95 [00:59<00:04, 1.62it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9603, LAS: 0.9242, UEM: 0.6540, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2837, partial_loss/deprel_loss: 0.3571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5389, loss: 0.5917, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 98%|#########7| 93/95 [01:02<00:01, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9603, LAS: 0.9243, UEM: 0.6653, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8845, partial_loss/deprel_loss: 0.5812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8383, loss: 0.5912, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 100%|##########| 95/95 [01:03<00:00, 1.50it/s]\n", + "2023-04-07 01:31:09,161 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9528, LAS: 0.9029, UEM: 0.8072, LEM: 0.6049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0580, partial_loss/deprel_loss: 15.0226, partial_loss/cycle_loss: 0.0000, batch_loss: 12.2297, loss: 8.1817, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:09, 1.05s/it]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9521, LAS: 0.9017, UEM: 0.7197, LEM: 0.4644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3701, partial_loss/deprel_loss: 7.7624, partial_loss/cycle_loss: 0.0000, batch_loss: 6.2839, loss: 8.5380, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:06, 1.02s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9540, LAS: 0.9034, UEM: 0.7199, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 5.8722, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7387, loss: 7.7018, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:03, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9512, LAS: 0.9000, UEM: 0.6878, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 10.7496, partial_loss/cycle_loss: 0.0000, batch_loss: 8.7834, loss: 8.3488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9512, LAS: 0.9000, UEM: 0.6878, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 10.7496, partial_loss/cycle_loss: 0.0000, batch_loss: 8.7834, loss: 8.3488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.00it/s]\n", + "2023-04-07 01:31:20,174 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:31:20,175 - INFO - 
combo.training.tensorboard_writer - reg_loss | 0.197 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UEM | 0.665 | 0.688\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - LEM | 0.439 | 0.410\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EM | 0.888 | 0.892\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.884 | 0.919\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | 0.951\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.581 | 10.750\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - loss | 0.591 | 8.349\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | 0.900\n", + "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
0.000\n", + "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:31:20,180 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:31:24,963 - INFO - combo.training.trainer - Epoch duration: 0:01:22.388611\n", + "2023-04-07 01:31:24,963 - INFO - combo.training.trainer - Estimated training time remaining: 4:57:13\n", + "2023-04-07 01:31:24,963 - INFO - allennlp.training.trainer - Epoch 141/399\n", + "2023-04-07 01:31:24,963 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:31:24,964 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:31:24,973 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9714, LAS: 0.9367, UEM: 0.7460, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4991, loss: 0.5037, batch_reg_loss: 0.1965, reg_loss: 0.1965 ||: 3%|3 | 3/95 [00:02<01:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9701, LAS: 0.9349, UEM: 0.7408, LEM: 0.4896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2253, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.5114, batch_reg_loss: 0.1965, reg_loss: 0.1965 ||: 6%|6 | 6/95 [00:04<01:12, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9699, LAS: 0.9346, UEM: 0.7492, LEM: 0.5091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4965, 
partial_loss/deprel_loss: 0.4303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6400, loss: 0.5193, batch_reg_loss: 0.1964, reg_loss: 0.1965 ||: 9%|9 | 9/95 [00:07<01:10, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9700, LAS: 0.9353, UEM: 0.7390, LEM: 0.4933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1402, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.5176, batch_reg_loss: 0.1964, reg_loss: 0.1965 ||: 14%|#3 | 13/95 [00:10<01:03, 1.29it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9668, LAS: 0.9321, UEM: 0.6963, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5385, loss: 0.5396, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 18%|#7 | 17/95 [00:12<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9660, LAS: 0.9314, UEM: 0.6880, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1620, partial_loss/deprel_loss: 0.2415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4220, loss: 0.5408, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9640, LAS: 0.9295, UEM: 0.6576, LEM: 0.4233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6444, loss: 0.5569, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 25%|##5 | 24/95 [00:17<00:49, 
1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9644, LAS: 0.9299, UEM: 0.6597, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3868, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5541, loss: 0.5500, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 28%|##8 | 27/95 [00:19<00:47, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9650, LAS: 0.9310, UEM: 0.6749, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5194, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6652, loss: 0.5463, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||: 33%|###2 | 31/95 [00:21<00:43, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9653, LAS: 0.9308, UEM: 0.6795, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1588, partial_loss/deprel_loss: 0.3028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.5468, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 37%|###6 | 35/95 [00:24<00:41, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9639, LAS: 0.9294, UEM: 0.6681, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6353, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6959, loss: 0.5570, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 40%|#### | 38/95 [00:27<00:40, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9635, LAS: 0.9291, UEM: 0.6576, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4292, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.5602, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 43%|####3 | 41/95 [00:29<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9636, LAS: 0.9291, UEM: 0.6645, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.4647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6832, loss: 0.5583, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 47%|####7 | 45/95 [00:32<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9643, LAS: 0.9298, UEM: 0.6827, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4058, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5840, loss: 0.5532, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 51%|##### | 48/95 [00:34<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9627, LAS: 0.9279, UEM: 0.6729, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7541, loss: 0.5667, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9612, LAS: 0.9263, UEM: 0.6632, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5556, loss: 0.5758, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 58%|#####7 | 55/95 [00:39<00:28, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9617, LAS: 0.9264, UEM: 0.6674, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5713, partial_loss/deprel_loss: 0.5004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7109, loss: 0.5742, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 62%|######2 | 59/95 [00:41<00:25, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9613, LAS: 0.9259, UEM: 0.6627, LEM: 0.4299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7711, partial_loss/deprel_loss: 0.4545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.5765, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 65%|######5 | 62/95 [00:43<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9620, LAS: 0.9269, UEM: 0.6826, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5707, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 68%|######8 | 65/95 [00:46<00:22, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9619, LAS: 0.9268, UEM: 0.6770, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.5722, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||: 72%|#######1 | 68/95 [00:48<00:19, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9623, LAS: 0.9269, UEM: 0.6827, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4133, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6101, loss: 0.5706, batch_reg_loss: 0.1962, reg_loss: 0.1964 ||: 75%|#######4 | 71/95 [00:50<00:17, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9613, LAS: 0.9259, UEM: 0.6748, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8964, partial_loss/deprel_loss: 0.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7943, loss: 0.5785, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 78%|#######7 | 74/95 [00:53<00:15, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9617, LAS: 0.9263, UEM: 0.6787, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1303, partial_loss/deprel_loss: 0.2875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4523, loss: 0.5757, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 81%|########1 | 77/95 [00:55<00:13, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9610, LAS: 0.9255, UEM: 0.6708, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.5810, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 85%|########5 | 81/95 [00:57<00:09, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9613, LAS: 0.9257, UEM: 0.6749, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5795, batch_reg_loss: 
0.1962, reg_loss: 0.1963 ||: 89%|########9 | 85/95 [00:59<00:06, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9608, LAS: 0.9253, UEM: 0.6695, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.4059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5769, loss: 0.5848, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 95%|#########4| 90/95 [01:01<00:02, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9602, LAS: 0.9246, UEM: 0.6635, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5889, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 100%|##########| 95/95 [01:04<00:00, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9602, LAS: 0.9246, UEM: 0.6635, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5889, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 100%|##########| 95/95 [01:04<00:00, 1.48it/s]\n", + "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - reg_loss | 0.196 | N/A\n", + "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UEM | 0.663 | N/A\n", + 
"2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LEM | 0.438 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - EM | 0.919 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.289 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.446 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - loss | 0.589 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LAS | 0.925 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:32,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:32,433 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:32:37,205 - INFO - combo.training.trainer - Epoch duration: 0:01:12.242078\n", + "2023-04-07 01:32:37,206 - INFO - combo.training.trainer - Estimated training time remaining: 4:56:11\n", + "2023-04-07 01:32:37,206 - INFO - allennlp.training.trainer - Epoch 142/399\n", + "2023-04-07 01:32:37,206 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:32:37,207 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:32:37,216 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9777, LAS: 0.9494, UEM: 0.8833, LEM: 0.7480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0388, partial_loss/deprel_loss: 0.1253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3042, loss: 0.4407, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||: 3%|3 | 3/95 [00:02<01:22, 1.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9649, LAS: 0.9341, UEM: 0.7764, LEM: 0.6172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7783, partial_loss/deprel_loss: 0.5240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7710, loss: 0.5270, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||: 7%|7 | 7/95 [00:05<01:11, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9649, LAS: 0.9322, UEM: 0.7507, LEM: 0.5661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5494, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6801, loss: 0.5340, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||: 11%|# | 10/95 [00:07<01:06, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9620, LAS: 0.9283, UEM: 0.6980, LEM: 0.5131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4609, partial_loss/deprel_loss: 0.4467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.5675, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||: 14%|#3 | 13/95 [00:09<01:04, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9587, LAS: 0.9246, UEM: 0.6785, LEM: 0.4945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0301, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8946, loss: 0.5862, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||: 17%|#6 | 16/95 [00:12<01:02, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9356, UAS: 0.9591, LAS: 0.9244, UEM: 0.6665, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.3529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5871, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||: 20%|## | 19/95 [00:14<00:59, 1.28it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9596, LAS: 0.9249, UEM: 0.6609, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6963, partial_loss/deprel_loss: 0.5092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7427, loss: 0.5863, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||: 23%|##3 | 22/95 [00:16<00:55, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9600, LAS: 0.9255, UEM: 0.6505, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5659, loss: 0.5816, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||: 27%|##7 | 26/95 [00:19<00:50, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9594, LAS: 0.9246, UEM: 0.6400, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1459, partial_loss/deprel_loss: 0.2655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4377, loss: 0.5892, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||: 32%|###1 | 30/95 [00:21<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9601, LAS: 0.9252, UEM: 0.6502, LEM: 0.4362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1923, partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5043, loss: 0.5835, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||: 36%|###5 | 34/95 [00:24<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9610, LAS: 0.9259, UEM: 0.6487, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2934, partial_loss/deprel_loss: 0.3326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.5772, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||: 40%|#### | 38/95 [00:27<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9602, LAS: 0.9251, UEM: 0.6432, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6596, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7616, loss: 0.5861, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||: 44%|####4 | 42/95 [00:29<00:36, 1.46it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9589, LAS: 0.9238, UEM: 0.6306, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3692, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.5962, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||: 48%|####8 | 46/95 [00:32<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9595, LAS: 0.9244, UEM: 0.6349, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5964, loss: 0.5920, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||: 52%|#####1 | 49/95 [00:34<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9596, LAS: 0.9245, UEM: 0.6418, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1112, partial_loss/deprel_loss: 0.2305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4027, loss: 0.5904, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 55%|#####4 | 52/95 [00:36<00:30, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9600, LAS: 0.9247, UEM: 0.6388, LEM: 0.4148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3810, partial_loss/deprel_loss: 0.3844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.5873, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 59%|#####8 | 56/95 [00:39<00:26, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9599, LAS: 0.9246, UEM: 0.6323, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2395, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5199, loss: 0.5898, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 63%|######3 | 60/95 [00:41<00:23, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9607, LAS: 0.9254, UEM: 0.6508, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1561, partial_loss/deprel_loss: 0.2461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4241, loss: 0.5838, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 67%|######7 | 64/95 [00:45<00:22, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9607, LAS: 0.9255, UEM: 0.6534, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.5826, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 71%|####### | 67/95 [00:47<00:21, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9614, LAS: 0.9263, UEM: 0.6692, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.5763, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 74%|#######3 | 70/95 [00:50<00:19, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9607, LAS: 0.9256, UEM: 0.6611, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4577, partial_loss/deprel_loss: 0.4822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6733, loss: 0.5809, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 77%|#######6 | 73/95 [00:52<00:16, 1.31it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9603, LAS: 0.9251, UEM: 0.6563, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6469, partial_loss/deprel_loss: 0.5195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7410, loss: 0.5840, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||: 80%|######## | 76/95 [00:54<00:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9606, LAS: 0.9252, UEM: 0.6554, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.5840, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 84%|########4 | 80/95 [00:57<00:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9608, LAS: 0.9254, UEM: 0.6583, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2209, partial_loss/deprel_loss: 0.3497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5198, loss: 0.5823, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 88%|########8 | 84/95 [00:59<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9605, LAS: 0.9248, UEM: 0.6545, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3878, partial_loss/deprel_loss: 0.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6208, loss: 0.5860, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 93%|#########2| 88/95 [01:02<00:04, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9608, LAS: 0.9254, UEM: 0.6593, LEM: 0.4381, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0785, partial_loss/deprel_loss: 0.2125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3816, loss: 0.5826, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 97%|#########6| 92/95 [01:05<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9607, LAS: 0.9253, UEM: 0.6619, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5634, loss: 0.5830, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 100%|##########| 95/95 [01:07<00:00, 1.42it/s]\n", + "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer - reg_loss | 0.196 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UEM | 0.662 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - LEM | 0.441 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.305 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.383 | N/A\n", + "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - loss | 0.583 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - LAS | 0.925 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:47,068 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:33:55,192 - INFO - combo.training.trainer - Epoch duration: 0:01:17.985545\n", + "2023-04-07 01:33:55,192 - INFO - combo.training.trainer - Estimated training time remaining: 4:55:18\n", + "2023-04-07 01:33:55,192 - INFO - allennlp.training.trainer - Epoch 143/399\n", + "2023-04-07 01:33:55,193 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:33:55,193 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:33:55,204 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9612, LAS: 0.9258, UEM: 0.6181, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1987, partial_loss/deprel_loss: 0.3033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4783, loss: 0.5987, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||: 3%|3 | 3/95 [00:02<01:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9610, LAS: 0.9261, UEM: 0.6852, LEM: 0.4737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1229, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4144, loss: 0.5864, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9638, LAS: 0.9298, UEM: 0.7018, LEM: 0.4829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4217, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.5592, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||: 9%|9 | 9/95 [00:06<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9642, LAS: 0.9291, UEM: 0.6939, LEM: 0.4609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3576, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6270, loss: 0.5620, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||: 14%|#3 | 13/95 [00:08<00:55, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9656, LAS: 0.9312, UEM: 0.6985, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2052, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5495, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||: 17%|#6 | 16/95 [00:10<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9652, LAS: 0.9304, UEM: 0.6762, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.4123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5898, loss: 0.5570, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||: 21%|##1 | 20/95 [00:13<00:49, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9641, LAS: 0.9292, UEM: 0.6711, LEM: 0.4237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8708, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8329, loss: 0.5636, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||: 25%|##5 | 24/95 [00:15<00:46, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9606, LAS: 0.9258, UEM: 0.6350, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7316, partial_loss/deprel_loss: 0.4971, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.5861, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||: 29%|##9 | 28/95 [00:18<00:42, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9622, LAS: 0.9276, UEM: 0.6612, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1479, partial_loss/deprel_loss: 0.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.5753, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||: 33%|###2 | 31/95 [00:20<00:42, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9620, LAS: 0.9273, UEM: 0.6577, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.5765, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||: 37%|###6 | 35/95 [00:23<00:39, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9617, LAS: 0.9270, UEM: 0.6629, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.5802, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||: 41%|####1 | 39/95 [00:25<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9618, LAS: 0.9267, UEM: 0.6589, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1680, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.5808, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||: 45%|####5 | 43/95 [00:28<00:34, 1.49it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9605, LAS: 0.9251, UEM: 0.6532, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1675, partial_loss/deprel_loss: 0.5706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8857, loss: 0.5888, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||: 49%|####9 | 47/95 [00:31<00:32, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9607, LAS: 0.9252, UEM: 0.6515, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5322, loss: 0.5878, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 53%|#####2 | 50/95 [00:33<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9607, LAS: 0.9253, UEM: 0.6461, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3210, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.5878, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 56%|#####5 | 53/95 [00:35<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9604, LAS: 0.9249, UEM: 0.6493, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6948, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7829, loss: 0.5891, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 60%|###### | 57/95 [00:38<00:25, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9609, LAS: 0.9253, UEM: 0.6618, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2951, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5847, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 63%|######3 | 60/95 [00:40<00:24, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9613, LAS: 0.9257, UEM: 0.6606, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1720, partial_loss/deprel_loss: 0.2721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4478, loss: 0.5817, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 67%|######7 | 64/95 [00:42<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9612, LAS: 0.9256, UEM: 0.6601, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1927, partial_loss/deprel_loss: 0.2857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4628, loss: 0.5822, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 71%|####### | 67/95 [00:45<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9606, LAS: 0.9249, UEM: 0.6512, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4352, partial_loss/deprel_loss: 0.4888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6738, loss: 0.5877, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 74%|#######3 | 70/95 [00:47<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9605, LAS: 0.9247, UEM: 0.6530, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0181, partial_loss/deprel_loss: 0.5776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8614, loss: 0.5887, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 77%|#######6 | 73/95 [00:49<00:15, 1.39it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9605, LAS: 0.9248, UEM: 0.6503, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6608, loss: 0.5886, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 80%|######## | 76/95 [00:51<00:13, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9610, LAS: 0.9253, UEM: 0.6573, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2688, partial_loss/deprel_loss: 0.3295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5130, loss: 0.5846, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 83%|########3 | 79/95 [00:54<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9608, LAS: 0.9250, UEM: 0.6565, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6618, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7311, loss: 0.5867, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||: 86%|########6 | 82/95 [00:56<00:09, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9610, LAS: 0.9251, UEM: 0.6557, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2986, partial_loss/deprel_loss: 0.3646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.5860, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 89%|########9 | 85/95 [00:58<00:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9736, UAS: 0.9613, LAS: 0.9255, UEM: 0.6675, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0363, partial_loss/deprel_loss: 0.0917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2763, loss: 0.5831, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 93%|#########2| 88/95 [01:01<00:05, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9614, LAS: 0.9255, UEM: 0.6705, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0890, partial_loss/deprel_loss: 0.2279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3958, loss: 0.5836, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 96%|#########5| 91/95 [01:03<00:03, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9613, LAS: 0.9255, UEM: 0.6654, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.5830, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 100%|##########| 95/95 [01:05<00:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9613, LAS: 0.9255, UEM: 0.6654, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.5830, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 100%|##########| 95/95 [01:05<00:00, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - reg_loss | 0.196 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UEM | 0.665 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - LEM | 0.440 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - EM | 0.918 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.378 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.385 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - loss | 0.583 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - LAS | 0.925 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:35:03,853 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:35:08,540 - INFO - combo.training.trainer - Epoch duration: 0:01:13.347534\n", + "2023-04-07 01:35:08,540 - INFO - combo.training.trainer - Estimated training time remaining: 4:54:17\n", + "2023-04-07 01:35:08,541 - INFO - allennlp.training.trainer - Epoch 144/399\n", + "2023-04-07 01:35:08,541 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:35:08,542 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:35:08,551 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9723, LAS: 0.9370, UEM: 0.7976, LEM: 0.5757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1629, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4709, loss: 0.5066, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||: 5%|5 | 5/95 [00:02<00:47, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9633, LAS: 0.9280, UEM: 0.7085, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5152, partial_loss/deprel_loss: 0.4897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6904, loss: 0.5663, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||: 9%|9 | 9/95 [00:05<00:47, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9630, LAS: 0.9273, UEM: 0.6953, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.5254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7254, loss: 0.5694, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||: 13%|#2 | 12/95 
[00:07<00:49, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9614, LAS: 0.9258, UEM: 0.6516, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3085, partial_loss/deprel_loss: 0.3481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5357, loss: 0.5813, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||: 17%|#6 | 16/95 [00:09<00:46, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9621, LAS: 0.9269, UEM: 0.6642, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5289, partial_loss/deprel_loss: 0.4735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6802, loss: 0.5716, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||: 20%|## | 19/95 [00:11<00:47, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9613, LAS: 0.9260, UEM: 0.6528, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6241, partial_loss/deprel_loss: 0.5382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.5783, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||: 24%|##4 | 23/95 [00:13<00:42, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9623, LAS: 0.9268, UEM: 0.6690, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1259, partial_loss/deprel_loss: 0.3156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4732, loss: 0.5720, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||: 28%|##8 | 27/95 [00:15<00:39, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9632, LAS: 0.9280, UEM: 0.6748, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5678, loss: 0.5657, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||: 34%|###3 | 32/95 [00:18<00:34, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9645, LAS: 0.9294, UEM: 0.6863, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1585, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4508, loss: 0.5558, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||: 38%|###7 | 36/95 [00:20<00:31, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9647, LAS: 0.9295, UEM: 0.6900, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3195, partial_loss/deprel_loss: 0.3555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.5537, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||: 42%|####2 | 40/95 [00:23<00:32, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9651, LAS: 0.9299, UEM: 0.6876, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3535, partial_loss/deprel_loss: 0.3828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5724, loss: 0.5509, batch_reg_loss: 0.1955, reg_loss: 0.1955 ||: 46%|####6 | 44/95 [00:25<00:31, 1.64it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9651, LAS: 0.9301, UEM: 0.7024, LEM: 0.4781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8110, partial_loss/deprel_loss: 0.5529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8000, loss: 0.5480, batch_reg_loss: 0.1954, reg_loss: 
0.1955 ||: 51%|##### | 48/95 [00:28<00:31, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9646, LAS: 0.9293, UEM: 0.6907, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5458, partial_loss/deprel_loss: 0.4938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.5549, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 55%|#####4 | 52/95 [00:31<00:28, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9645, LAS: 0.9294, UEM: 0.6857, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1897, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.5570, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9640, LAS: 0.9288, UEM: 0.6758, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.5605, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 62%|######2 | 59/95 [00:36<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9634, LAS: 0.9284, UEM: 0.6720, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5894, partial_loss/deprel_loss: 0.5012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7142, loss: 0.5645, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 65%|######5 | 62/95 [00:39<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9638, LAS: 0.9287, UEM: 0.6787, LEM: 0.4522, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1116, partial_loss/deprel_loss: 0.2341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4050, loss: 0.5608, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 68%|######8 | 65/95 [00:41<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9633, LAS: 0.9283, UEM: 0.6693, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5677, loss: 0.5637, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 73%|#######2 | 69/95 [00:43<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9629, LAS: 0.9280, UEM: 0.6674, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7485, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7062, loss: 0.5651, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 76%|#######5 | 72/95 [00:45<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9269, UEM: 0.6596, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3724, partial_loss/deprel_loss: 0.3970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5729, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||: 79%|#######8 | 75/95 [00:48<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9619, LAS: 0.9271, UEM: 0.6603, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3534, partial_loss/deprel_loss: 0.4346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.5717, batch_reg_loss: 0.1954, reg_loss: 0.1955 
||: 82%|########2 | 78/95 [00:50<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9615, LAS: 0.9268, UEM: 0.6553, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2096, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.5751, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 86%|########6 | 82/95 [00:52<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9619, LAS: 0.9272, UEM: 0.6680, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0249, partial_loss/deprel_loss: 0.1024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2823, loss: 0.5727, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 89%|########9 | 85/95 [00:55<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9620, LAS: 0.9273, UEM: 0.6675, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2200, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5166, loss: 0.5713, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 93%|#########2| 88/95 [00:57<00:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8677, UAS: 0.9617, LAS: 0.9269, UEM: 0.6699, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1521, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9512, loss: 0.5735, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 96%|#########5| 91/95 [00:59<00:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9613, LAS: 0.9264, UEM: 0.6673, LEM: 0.4460, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5637, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 0.5766, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 99%|#########8| 94/95 [01:01<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9610, LAS: 0.9261, UEM: 0.6648, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8027, partial_loss/deprel_loss: 0.5686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8107, loss: 0.5790, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 100%|##########| 95/95 [01:02<00:00, 1.53it/s]\n", + "2023-04-07 01:36:13,968 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - reg_loss | 0.195 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UEM | 0.665 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - LEM | 0.444 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EM | 0.896 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.803 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.569 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - loss | 0.579 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:13,975 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:36:18,797 - INFO - combo.training.trainer - Epoch duration: 0:01:10.256214\n", + "2023-04-07 01:36:18,797 - INFO - combo.training.trainer - Estimated training time remaining: 4:53:10\n", + "2023-04-07 01:36:18,797 - INFO - allennlp.training.trainer - Epoch 145/399\n", + "2023-04-07 01:36:18,798 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:36:18,798 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:36:18,805 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9674, LAS: 0.9300, UEM: 0.6255, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3173, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5049, loss: 0.5278, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 3%|3 | 3/95 [00:02<01:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9622, LAS: 0.9265, UEM: 0.5693, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5101, partial_loss/deprel_loss: 0.4328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.5750, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9651, LAS: 0.9292, UEM: 0.6349, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4242, partial_loss/deprel_loss: 0.4547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6439, loss: 0.5553, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 9%|9 | 9/95 
[00:06<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9640, LAS: 0.9284, UEM: 0.6207, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.5611, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 14%|#3 | 13/95 [00:09<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9604, LAS: 0.9250, UEM: 0.5805, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2846, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5378, loss: 0.5831, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 18%|#7 | 17/95 [00:11<00:53, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9618, LAS: 0.9270, UEM: 0.6036, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4053, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6467, loss: 0.5713, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 21%|##1 | 20/95 [00:13<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9616, LAS: 0.9270, UEM: 0.6131, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2207, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5725, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||: 24%|##4 | 23/95 [00:16<00:53, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9614, LAS: 0.9270, UEM: 0.6195, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7586, partial_loss/deprel_loss: 0.5081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7535, loss: 0.5743, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||: 27%|##7 | 26/95 [00:18<00:50, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9593, LAS: 0.9252, UEM: 0.5982, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5271, partial_loss/deprel_loss: 0.4619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6701, loss: 0.5885, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||: 32%|###1 | 30/95 [00:20<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9583, LAS: 0.9241, UEM: 0.5792, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5811, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.5922, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||: 37%|###6 | 35/95 [00:23<00:37, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9250, UEM: 0.5971, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3866, partial_loss/deprel_loss: 0.4137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.5853, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||: 42%|####2 | 40/95 [00:25<00:31, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9598, LAS: 0.9258, UEM: 0.6005, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2454, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.5803, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||: 47%|####7 | 45/95 [00:27<00:26, 1.90it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9589, LAS: 0.9247, UEM: 0.6081, LEM: 0.3712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1542, partial_loss/deprel_loss: 0.3116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4753, loss: 0.5880, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||: 52%|#####1 | 49/95 [00:29<00:24, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9588, LAS: 0.9248, UEM: 0.6300, LEM: 0.4076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0358, partial_loss/deprel_loss: 0.1138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2934, loss: 0.5870, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||: 56%|#####5 | 53/95 [00:32<00:23, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9597, LAS: 0.9255, UEM: 0.6463, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.5811, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||: 60%|###### | 57/95 [00:35<00:23, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9604, LAS: 0.9261, UEM: 0.6547, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3106, partial_loss/deprel_loss: 0.3452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.5771, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||: 64%|######4 | 61/95 [00:38<00:22, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9610, LAS: 0.9265, UEM: 0.6585, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.1048, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4224, loss: 0.5743, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 68%|######8 | 65/95 [00:41<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9617, LAS: 0.9271, UEM: 0.6651, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2053, partial_loss/deprel_loss: 0.2998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5705, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 73%|#######2 | 69/95 [00:44<00:17, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9602, LAS: 0.9255, UEM: 0.6554, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0145, partial_loss/deprel_loss: 0.6211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8949, loss: 0.5812, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 77%|#######6 | 73/95 [00:46<00:14, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9605, LAS: 0.9257, UEM: 0.6660, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1002, partial_loss/deprel_loss: 0.1881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3656, loss: 0.5797, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 81%|########1 | 77/95 [00:49<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9605, LAS: 0.9256, UEM: 0.6679, LEM: 0.4412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1022, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4293, loss: 0.5810, batch_reg_loss: 0.1951, reg_loss: 0.1952 
||: 84%|########4 | 80/95 [00:52<00:10, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9605, LAS: 0.9255, UEM: 0.6646, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4826, loss: 0.5823, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 87%|########7 | 83/95 [00:54<00:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9604, LAS: 0.9253, UEM: 0.6573, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3819, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6033, loss: 0.5847, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 92%|#########1| 87/95 [00:56<00:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9609, LAS: 0.9258, UEM: 0.6642, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1931, partial_loss/deprel_loss: 0.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5812, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 96%|#########5| 91/95 [00:59<00:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9611, LAS: 0.9259, UEM: 0.6668, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1362, partial_loss/deprel_loss: 0.3189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4774, loss: 0.5804, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||: 99%|#########8| 94/95 [01:01<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9612, LAS: 0.9261, UEM: 0.6660, LEM: 0.4371, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2646, partial_loss/deprel_loss: 0.2843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.5793, batch_reg_loss: 0.1950, reg_loss: 0.1952 ||: 100%|##########| 95/95 [01:02<00:00, 1.52it/s]\n", + "2023-04-07 01:37:24,348 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9470, LAS: 0.9012, UEM: 0.8096, LEM: 0.6413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5334, partial_loss/deprel_loss: 19.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9854, loss: 10.0469, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 18%|#8 | 2/11 [00:02<00:10, 1.20s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9530, LAS: 0.9044, UEM: 0.7198, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8728, partial_loss/deprel_loss: 10.5768, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6360, loss: 8.1821, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:06, 1.09s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9476, LAS: 0.8963, UEM: 0.6564, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2028, partial_loss/deprel_loss: 16.7362, partial_loss/cycle_loss: 0.0000, batch_loss: 13.6295, loss: 9.5178, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:07<00:04, 1.09s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9507, LAS: 0.8985, UEM: 0.6791, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0512, 
partial_loss/deprel_loss: 9.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 7.7174, loss: 8.5489, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:09<00:01, 1.05s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9523, LAS: 0.9007, UEM: 0.6903, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4198, partial_loss/deprel_loss: 6.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1963, loss: 8.2441, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02it/s]\n", + "2023-04-07 01:37:35,130 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - reg_loss | 0.195 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UEM | 0.666 | 0.690\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - LEM | 0.437 | 0.407\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EM | 0.940 | 0.923\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.265 | 0.420\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | 0.952\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:37:35,131 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.284 | 6.390\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - loss | 0.579 | 8.244\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | 0.901\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:37:35,137 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:37:39,900 - INFO - combo.training.trainer - Epoch duration: 0:01:21.102822\n", + "2023-04-07 01:37:39,901 - INFO - combo.training.trainer - Estimated training time remaining: 4:52:22\n", + "2023-04-07 01:37:39,901 - INFO - allennlp.training.trainer - Epoch 146/399\n", + "2023-04-07 01:37:39,905 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:37:39,906 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:37:39,913 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9768, LAS: 0.9408, UEM: 0.8439, LEM: 0.6231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1214, partial_loss/deprel_loss: 0.2641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.4573, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 3%|3 | 3/95 [00:02<01:18, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9656, LAS: 0.9303, UEM: 0.7362, LEM: 0.5173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2008, partial_loss/deprel_loss: 0.2163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5202, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 7%|7 | 7/95 [00:05<01:10, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9653, LAS: 0.9298, UEM: 0.7205, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5366, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 11%|# | 10/95 
[00:07<01:07, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9647, LAS: 0.9291, UEM: 0.7005, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5481, partial_loss/deprel_loss: 0.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6742, loss: 0.5476, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 14%|#3 | 13/95 [00:09<01:02, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9629, LAS: 0.9284, UEM: 0.6838, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 0.2970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4745, loss: 0.5543, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 18%|#7 | 17/95 [00:12<00:57, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9616, LAS: 0.9267, UEM: 0.6563, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2811, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.5677, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 21%|##1 | 20/95 [00:14<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9622, LAS: 0.9272, UEM: 0.6612, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4932, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6804, loss: 0.5689, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 25%|##5 | 24/95 [00:16<00:49, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9633, LAS: 0.9285, UEM: 0.6871, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6006, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.5618, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||: 28%|##8 | 27/95 [00:18<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9643, LAS: 0.9289, UEM: 0.6968, LEM: 0.4663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.3049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5555, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 32%|###1 | 30/95 [00:21<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9625, LAS: 0.9271, UEM: 0.6957, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9823, partial_loss/deprel_loss: 0.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.5663, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 36%|###5 | 34/95 [00:23<00:39, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9636, LAS: 0.9282, UEM: 0.6939, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4423, loss: 0.5609, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 41%|####1 | 39/95 [00:25<00:33, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9639, LAS: 0.9289, UEM: 0.6881, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1559, partial_loss/deprel_loss: 0.3300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4901, loss: 0.5559, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 46%|####6 | 44/95 [00:27<00:27, 1.83it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9631, LAS: 0.9280, UEM: 0.6779, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4824, partial_loss/deprel_loss: 0.4924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6853, loss: 0.5623, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 52%|#####1 | 49/95 [00:30<00:24, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9618, LAS: 0.9267, UEM: 0.6693, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2899, partial_loss/deprel_loss: 0.3352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.5714, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 56%|#####5 | 53/95 [00:33<00:24, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9617, LAS: 0.9264, UEM: 0.6631, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.4529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6362, loss: 0.5723, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||: 60%|###### | 57/95 [00:35<00:21, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9621, LAS: 0.9268, UEM: 0.6765, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7021, loss: 0.5705, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 64%|######4 | 61/95 [00:38<00:21, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9621, LAS: 0.9267, UEM: 0.6761, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4551, partial_loss/deprel_loss: 0.4019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6074, loss: 0.5689, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 68%|######8 | 65/95 [00:41<00:20, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9622, LAS: 0.9267, UEM: 0.6769, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6631, partial_loss/deprel_loss: 0.5134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7382, loss: 0.5699, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 73%|#######2 | 69/95 [00:44<00:17, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9615, LAS: 0.9261, UEM: 0.6703, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.3933, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.5745, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 76%|#######5 | 72/95 [00:46<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9615, LAS: 0.9261, UEM: 0.6662, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2535, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.5748, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 79%|#######8 | 75/95 [00:48<00:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9614, LAS: 0.9259, UEM: 0.6647, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2812, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5207, loss: 0.5753, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 
83%|########3 | 79/95 [00:50<00:10, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9616, LAS: 0.9261, UEM: 0.6633, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.2803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4684, loss: 0.5736, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 87%|########7 | 83/95 [00:53<00:07, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9613, LAS: 0.9258, UEM: 0.6611, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5645, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6726, loss: 0.5760, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 92%|#########1| 87/95 [00:55<00:05, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9615, LAS: 0.9260, UEM: 0.6667, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8177, partial_loss/deprel_loss: 0.6482, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8769, loss: 0.5753, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 96%|#########5| 91/95 [00:58<00:02, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9611, LAS: 0.9257, UEM: 0.6636, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7940, partial_loss/deprel_loss: 0.4946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5771, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 100%|##########| 95/95 [01:01<00:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9611, LAS: 0.9257, UEM: 0.6636, LEM: 0.4424, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7940, partial_loss/deprel_loss: 0.4946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5771, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - reg_loss | 0.195 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UEM | 0.664 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - LEM | 0.442 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EM | 0.905 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.794 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.495 | N/A\n", + "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - loss | 0.577 | N/A\n", + "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | N/A\n", + "2023-04-07 
01:38:44,418 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:44,424 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:38:49,391 - INFO - combo.training.trainer - Epoch duration: 0:01:09.489946\n", + "2023-04-07 01:38:49,391 - INFO - combo.training.trainer - Estimated training time remaining: 4:51:14\n", + "2023-04-07 01:38:49,391 - INFO - allennlp.training.trainer - Epoch 147/399\n", + "2023-04-07 01:38:49,392 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:38:49,392 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:38:49,401 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9700, LAS: 0.9320, UEM: 0.8024, LEM: 0.5889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0914, partial_loss/deprel_loss: 0.2178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.5235, batch_reg_loss: 0.1948, reg_loss: 0.1948 ||: 3%|3 | 3/95 [00:02<01:16, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9558, LAS: 0.9185, UEM: 0.7202, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4417, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6787, loss: 0.6081, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 6%|6 | 6/95 [00:04<01:13, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9608, LAS: 0.9236, UEM: 0.7109, LEM: 0.4619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3048, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.5829, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 9%|9 | 9/95 [00:07<01:08, 1.25it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9621, LAS: 0.9253, UEM: 0.7227, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.2442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.5705, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 13%|#2 | 12/95 [00:09<01:03, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9590, LAS: 0.9226, UEM: 0.6710, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5053, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.5941, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 17%|#6 | 16/95 [00:11<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9601, LAS: 0.9239, UEM: 0.6670, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3350, partial_loss/deprel_loss: 0.3966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.5888, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 
21%|##1 | 20/95 [00:14<00:51, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9612, LAS: 0.9254, UEM: 0.6634, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4431, partial_loss/deprel_loss: 0.4889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6745, loss: 0.5834, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 25%|##5 | 24/95 [00:16<00:47, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9598, LAS: 0.9239, UEM: 0.6607, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0689, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9496, loss: 0.5918, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 29%|##9 | 28/95 [00:18<00:42, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9590, LAS: 0.9234, UEM: 0.6451, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2733, partial_loss/deprel_loss: 0.3431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.5965, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 34%|###3 | 32/95 [00:20<00:37, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9580, LAS: 0.9230, UEM: 0.6245, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3928, partial_loss/deprel_loss: 0.3778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5755, loss: 0.6015, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 38%|###7 | 36/95 [00:23<00:36, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9593, LAS: 0.9242, UEM: 0.6439, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1932, partial_loss/deprel_loss: 0.2998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4732, loss: 0.5942, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 42%|####2 | 40/95 [00:26<00:35, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9601, LAS: 0.9250, UEM: 0.6481, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2105, partial_loss/deprel_loss: 0.3241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4961, loss: 0.5866, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||: 46%|####6 | 44/95 [00:28<00:32, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9606, LAS: 0.9257, UEM: 0.6478, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5097, partial_loss/deprel_loss: 0.4705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.5840, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 51%|##### | 48/95 [00:31<00:31, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9613, LAS: 0.9265, UEM: 0.6749, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1654, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.5765, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 55%|#####4 | 52/95 [00:35<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9619, LAS: 0.9270, UEM: 0.6761, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1565, partial_loss/deprel_loss: 0.2634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.5739, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 60%|###### | 57/95 [00:37<00:24, 
1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9621, LAS: 0.9269, UEM: 0.6679, LEM: 0.4428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.4833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6617, loss: 0.5763, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 65%|######5 | 62/95 [00:39<00:19, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9616, LAS: 0.9263, UEM: 0.6622, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4189, partial_loss/deprel_loss: 0.4651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6504, loss: 0.5801, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 71%|####### | 67/95 [00:41<00:15, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9609, LAS: 0.9256, UEM: 0.6548, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5795, loss: 0.5847, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||: 75%|#######4 | 71/95 [00:44<00:13, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9612, LAS: 0.9259, UEM: 0.6641, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6663, partial_loss/deprel_loss: 0.5419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.5817, batch_reg_loss: 0.1945, reg_loss: 0.1947 ||: 79%|#######8 | 75/95 [00:49<00:15, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9612, LAS: 0.9259, UEM: 0.6713, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.9395, partial_loss/deprel_loss: 0.6295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8860, loss: 0.5815, batch_reg_loss: 0.1945, reg_loss: 0.1947 ||: 83%|########3 | 79/95 [00:52<00:12, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9617, LAS: 0.9264, UEM: 0.6751, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.2679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4423, loss: 0.5777, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 86%|########6 | 82/95 [00:54<00:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9615, LAS: 0.9262, UEM: 0.6700, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4818, partial_loss/deprel_loss: 0.4349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6388, loss: 0.5791, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 89%|########9 | 85/95 [00:56<00:07, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9614, LAS: 0.9261, UEM: 0.6673, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1892, partial_loss/deprel_loss: 0.3540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5155, loss: 0.5804, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 94%|#########3| 89/95 [00:59<00:04, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9614, LAS: 0.9261, UEM: 0.6708, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3842, partial_loss/deprel_loss: 0.4363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.5801, 
batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 97%|#########6| 92/95 [01:01<00:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9613, LAS: 0.9259, UEM: 0.6690, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4985, loss: 0.5819, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 100%|##########| 95/95 [01:03<00:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9613, LAS: 0.9259, UEM: 0.6690, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4985, loss: 0.5819, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 01:39:56,277 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:39:56,277 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - reg_loss | 0.195 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UEM | 0.669 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LEM | 0.447 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EM | 0.927 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.203 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO 
- combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.329 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - loss | 0.582 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:56,284 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:40:02,411 - INFO - combo.training.trainer - Epoch duration: 0:01:13.019938\n", + "2023-04-07 01:40:02,412 - INFO - combo.training.trainer - Estimated training time remaining: 4:50:12\n", + "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - Epoch 148/399\n", + "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:40:02,420 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9744, LAS: 0.9410, UEM: 0.7404, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1520, partial_loss/deprel_loss: 0.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4530, loss: 0.4921, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||: 3%|3 | 3/95 [00:02<01:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9688, LAS: 0.9367, UEM: 0.6836, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.2594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4398, loss: 0.5078, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||: 7%|7 | 7/95 [00:04<00:59, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9651, LAS: 0.9312, UEM: 0.7144, LEM: 0.4688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0441, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9223, loss: 0.5370, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||: 11%|# | 10/95 [00:07<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9626, LAS: 0.9289, UEM: 0.6773, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3531, partial_loss/deprel_loss: 0.4054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5894, loss: 0.5538, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||: 14%|#3 | 13/95 [00:09<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9644, LAS: 0.9311, UEM: 0.7024, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1947, partial_loss/deprel_loss: 0.2653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.5368, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||: 17%|#6 | 16/95 [00:11<01:00, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9654, LAS: 0.9322, UEM: 0.6880, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2423, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.5309, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||: 21%|##1 | 20/95 [00:14<00:53, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9655, LAS: 0.9318, UEM: 0.6834, LEM: 0.4356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.3251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.5338, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||: 25%|##5 | 24/95 [00:16<00:47, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9652, LAS: 0.9317, UEM: 0.6777, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1851, partial_loss/deprel_loss: 0.2392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4228, loss: 0.5354, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||: 28%|##8 | 27/95 [00:18<00:46, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9654, LAS: 0.9316, UEM: 0.6774, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6069, loss: 0.5384, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||: 32%|###1 | 30/95 [00:20<00:44, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9659, LAS: 0.9320, UEM: 0.6825, LEM: 0.4370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.4138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.5368, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||: 35%|###4 | 33/95 [00:22<00:42, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9649, LAS: 0.9308, UEM: 0.6832, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2323, partial_loss/deprel_loss: 0.5903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9130, loss: 0.5444, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||: 38%|###7 | 36/95 [00:24<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9635, LAS: 0.9291, UEM: 0.6664, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7926, partial_loss/deprel_loss: 0.5206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7694, loss: 0.5546, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 42%|####2 | 40/95 [00:27<00:36, 1.51it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9640, LAS: 0.9295, UEM: 0.6878, LEM: 0.4542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0724, partial_loss/deprel_loss: 0.1789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3519, loss: 0.5502, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 46%|####6 | 44/95 [00:30<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9631, LAS: 0.9284, UEM: 0.6779, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.3649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5405, loss: 0.5579, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 49%|####9 | 47/95 [00:32<00:34, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9623, LAS: 0.9276, UEM: 0.6673, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2135, partial_loss/deprel_loss: 0.3543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5204, loss: 0.5629, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 54%|#####3 | 51/95 [00:35<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9622, LAS: 0.9275, UEM: 0.6637, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5394, partial_loss/deprel_loss: 0.4958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6988, loss: 0.5639, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 57%|#####6 | 54/95 [00:37<00:28, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9625, LAS: 0.9277, UEM: 0.6680, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.1957, partial_loss/deprel_loss: 0.2777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.5613, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 61%|######1 | 58/95 [00:39<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9500, UAS: 0.9631, LAS: 0.9283, UEM: 0.6834, LEM: 0.4509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0752, partial_loss/deprel_loss: 0.2441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5568, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 64%|######4 | 61/95 [00:42<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9616, LAS: 0.9267, UEM: 0.6699, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8370, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.5667, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 68%|######8 | 65/95 [00:44<00:20, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9619, LAS: 0.9273, UEM: 0.6804, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0577, partial_loss/deprel_loss: 0.1130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2962, loss: 0.5648, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 74%|#######3 | 70/95 [00:47<00:15, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9621, LAS: 0.9274, UEM: 0.6767, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1719, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4349, loss: 0.5652, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||: 79%|#######8 | 75/95 [00:49<00:11, 1.71it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9623, LAS: 0.9276, UEM: 0.6764, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6284, partial_loss/deprel_loss: 0.5133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.5645, batch_reg_loss: 0.1942, reg_loss: 0.1944 ||: 84%|########4 | 80/95 [00:51<00:08, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9615, LAS: 0.9268, UEM: 0.6698, LEM: 0.4466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5624, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.5706, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||: 88%|########8 | 84/95 [00:55<00:06, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9619, LAS: 0.9270, UEM: 0.6704, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.4192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.5695, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||: 93%|#########2| 88/95 [00:58<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9620, LAS: 0.9270, UEM: 0.6698, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6388, partial_loss/deprel_loss: 0.5363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7510, loss: 0.5693, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||: 97%|#########6| 92/95 [01:01<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9618, LAS: 0.9268, UEM: 0.6647, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6035, partial_loss/deprel_loss: 0.5098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7227, loss: 0.5714, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||: 100%|##########| 95/95 [01:03<00:00, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:41:08,690 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - reg_loss | 0.194 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UEM | 0.665 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - LEM | 0.438 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EM | 0.908 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.603 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.510 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - loss | 0.571 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 
01:41:08,692 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:41:08,697 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:41:13,618 - INFO - combo.training.trainer - Epoch duration: 0:01:11.205192\n", + "2023-04-07 01:41:13,618 - INFO - combo.training.trainer - Estimated training time remaining: 4:49:06\n", + "2023-04-07 01:41:13,618 - INFO - allennlp.training.trainer - Epoch 149/399\n", + "2023-04-07 01:41:13,618 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:41:13,619 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:41:13,628 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9614, LAS: 0.9257, UEM: 0.6583, LEM: 0.4530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1289, partial_loss/deprel_loss: 0.2566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4253, loss: 0.5710, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||: 3%|3 | 3/95 [00:02<01:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9226, UEM: 0.5729, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.5999, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||: 6%|6 | 6/95 [00:04<01:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9594, LAS: 0.9240, UEM: 0.5481, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4907, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.6039, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||: 9%|9 | 9/95 [00:06<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9640, LAS: 0.9293, UEM: 0.6384, LEM: 0.3999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.2807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4500, loss: 0.5638, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||: 13%|#2 | 12/95 [00:08<01:02, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9641, LAS: 0.9295, UEM: 0.6795, LEM: 0.4486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2402, partial_loss/deprel_loss: 0.3336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5631, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||: 16%|#5 | 15/95 [00:11<00:59, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9641, LAS: 0.9299, UEM: 0.6658, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4784, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6541, loss: 0.5623, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||: 19%|#8 | 18/95 [00:13<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9644, LAS: 0.9301, UEM: 0.6699, LEM: 0.4357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.2600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4309, loss: 0.5605, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||: 22%|##2 | 21/95 [00:15<00:55, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9627, LAS: 0.9285, UEM: 0.6464, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4797, partial_loss/deprel_loss: 0.4261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6309, loss: 0.5696, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||: 25%|##5 | 24/95 [00:17<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9632, LAS: 0.9292, UEM: 0.6490, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5631, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||: 28%|##8 | 27/95 [00:19<00:50, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9637, LAS: 0.9297, UEM: 0.6502, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.3734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5640, loss: 0.5609, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||: 32%|###1 | 30/95 [00:22<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9633, LAS: 0.9293, UEM: 0.6401, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2135, 
partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5665, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 35%|###4 | 33/95 [00:24<00:44, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9615, LAS: 0.9274, UEM: 0.6421, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1411, partial_loss/deprel_loss: 0.2652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5764, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 38%|###7 | 36/95 [00:26<00:42, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9622, LAS: 0.9280, UEM: 0.6450, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3323, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.5730, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 42%|####2 | 40/95 [00:28<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9625, LAS: 0.9282, UEM: 0.6431, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2572, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5720, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 45%|####5 | 43/95 [00:30<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9626, LAS: 0.9281, UEM: 0.6375, LEM: 0.3997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.2949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4676, loss: 0.5702, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||: 49%|####9 | 47/95 
[00:33<00:32, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9620, LAS: 0.9276, UEM: 0.6397, LEM: 0.4051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1029, partial_loss/deprel_loss: 0.2344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4021, loss: 0.5730, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 53%|#####2 | 50/95 [00:35<00:31, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9628, LAS: 0.9284, UEM: 0.6473, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.3205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4910, loss: 0.5673, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9627, LAS: 0.9284, UEM: 0.6482, LEM: 0.4126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1409, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.5673, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 59%|#####8 | 56/95 [00:40<00:28, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9618, LAS: 0.9274, UEM: 0.6350, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5930, partial_loss/deprel_loss: 0.5383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7432, loss: 0.5728, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 63%|######3 | 60/95 [00:42<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9623, LAS: 0.9279, UEM: 0.6453, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.3706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.5693, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 66%|######6 | 63/95 [00:44<00:22, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9612, LAS: 0.9269, UEM: 0.6377, LEM: 0.4055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4288, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.5769, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 69%|######9 | 66/95 [00:47<00:21, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9612, LAS: 0.9269, UEM: 0.6398, LEM: 0.4071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2262, partial_loss/deprel_loss: 0.3117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5758, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 73%|#######2 | 69/95 [00:49<00:19, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9622, LAS: 0.9279, UEM: 0.6668, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1521, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4982, loss: 0.5689, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 76%|#######5 | 72/95 [00:52<00:18, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9618, LAS: 0.9275, UEM: 0.6608, LEM: 0.4356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6352, partial_loss/deprel_loss: 0.4216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.5719, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 79%|#######8 | 75/95 
[00:54<00:15, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9614, LAS: 0.9270, UEM: 0.6562, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3477, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6083, loss: 0.5751, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||: 82%|########2 | 78/95 [00:56<00:12, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9613, LAS: 0.9269, UEM: 0.6668, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0557, partial_loss/deprel_loss: 0.1716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3424, loss: 0.5738, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||: 86%|########6 | 82/95 [00:58<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9614, LAS: 0.9270, UEM: 0.6651, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5314, loss: 0.5739, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||: 92%|#########1| 87/95 [01:01<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9620, LAS: 0.9275, UEM: 0.6744, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1524, partial_loss/deprel_loss: 0.2935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4592, loss: 0.5696, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||: 96%|#########5| 91/95 [01:04<00:02, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9619, LAS: 0.9274, UEM: 0.6710, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1426, partial_loss/deprel_loss: 0.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4658, loss: 0.5702, batch_reg_loss: 0.1939, reg_loss: 0.1940 ||: 100%|##########| 95/95 [01:06<00:00, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9619, LAS: 0.9274, UEM: 0.6710, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1426, partial_loss/deprel_loss: 0.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4658, loss: 0.5702, batch_reg_loss: 0.1939, reg_loss: 0.1940 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - reg_loss | 0.194 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UEM | 0.671 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - LEM | 0.445 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EM | 0.941 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.143 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - 
combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.304 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - loss | 0.570 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:42:23,405 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:42:30,545 - INFO - combo.training.trainer - Epoch duration: 0:01:16.926598\n", + "2023-04-07 01:42:30,545 - INFO - combo.training.trainer - Estimated training time remaining: 4:48:10\n", + "2023-04-07 01:42:30,546 - INFO - allennlp.training.trainer - Epoch 150/399\n", + "2023-04-07 01:42:30,546 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:42:30,547 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:42:30,557 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9660, LAS: 0.9301, UEM: 0.7472, LEM: 0.5735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.5159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7171, loss: 0.5174, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||: 3%|3 | 3/95 [00:02<01:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9654, LAS: 0.9296, UEM: 0.7582, LEM: 0.5888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3937, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.5311, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||: 6%|6 | 6/95 [00:04<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9632, LAS: 0.9271, UEM: 0.7234, LEM: 0.5403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5025, partial_loss/deprel_loss: 0.3931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6089, loss: 0.5487, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||: 9%|9 | 9/95 [00:06<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9621, LAS: 0.9274, UEM: 0.6765, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6303, partial_loss/deprel_loss: 0.4333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6665, loss: 0.5548, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||: 14%|#3 | 13/95 [00:08<00:56, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9601, LAS: 0.9255, UEM: 0.6530, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5703, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||: 18%|#7 | 17/95 [00:11<00:52, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9610, LAS: 0.9265, UEM: 0.6526, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2210, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.5622, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||: 21%|##1 | 20/95 [00:13<00:51, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9602, LAS: 0.9258, UEM: 0.6538, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.5697, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||: 24%|##4 | 23/95 [00:16<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9603, LAS: 0.9256, UEM: 0.6631, LEM: 0.4543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0864, partial_loss/deprel_loss: 0.2300, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.3951, loss: 0.5738, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||: 27%|##7 | 26/95 [00:18<00:49, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9601, LAS: 0.9251, UEM: 0.6614, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1643, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4691, loss: 0.5745, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||: 32%|###1 | 30/95 [00:21<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9614, LAS: 0.9263, UEM: 0.6774, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1403, partial_loss/deprel_loss: 0.2896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4535, loss: 0.5672, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 35%|###4 | 33/95 [00:23<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9606, LAS: 0.9259, UEM: 0.6663, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2420, partial_loss/deprel_loss: 0.2978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4805, loss: 0.5706, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 39%|###8 | 37/95 [00:26<00:41, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9610, LAS: 0.9263, UEM: 0.6568, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.5693, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 43%|####3 | 41/95 [00:28<00:37, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9607, LAS: 0.9261, UEM: 0.6518, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4473, loss: 0.5723, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 46%|####6 | 44/95 [00:31<00:37, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9613, LAS: 0.9269, UEM: 0.6689, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5654, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 49%|####9 | 47/95 [00:33<00:37, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9617, LAS: 0.9273, UEM: 0.6746, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1656, partial_loss/deprel_loss: 0.2683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.5625, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 53%|#####2 | 50/95 [00:35<00:34, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9613, LAS: 0.9269, UEM: 0.6674, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6161, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6700, loss: 0.5647, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||: 56%|#####5 | 53/95 [00:38<00:31, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9611, LAS: 0.9265, UEM: 0.6608, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5683, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 59%|#####8 | 56/95 [00:40<00:28, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9602, LAS: 0.9257, UEM: 0.6464, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.5758, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 63%|######3 | 60/95 [00:42<00:24, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9752, UAS: 0.9611, LAS: 0.9269, UEM: 0.6718, LEM: 0.4589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.1154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2911, loss: 0.5690, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 66%|######6 | 63/95 [00:44<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9618, LAS: 0.9275, UEM: 0.6753, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4824, loss: 0.5649, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 71%|####### | 67/95 [00:47<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9622, LAS: 0.9279, UEM: 0.6779, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1592, partial_loss/deprel_loss: 0.2677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.5626, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 74%|#######3 | 70/95 [00:49<00:17, 1.39it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9623, LAS: 0.9279, UEM: 0.6740, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4977, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6419, loss: 0.5636, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 77%|#######6 | 73/95 [00:51<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9624, LAS: 0.9278, UEM: 0.6712, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2408, partial_loss/deprel_loss: 0.3397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5636, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 80%|######## | 76/95 [00:54<00:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9630, LAS: 0.9283, UEM: 0.6791, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1598, partial_loss/deprel_loss: 0.2910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4584, loss: 0.5600, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||: 84%|########4 | 80/95 [00:57<00:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9628, LAS: 0.9281, UEM: 0.6764, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1033, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4181, loss: 0.5623, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||: 88%|########8 | 84/95 [00:59<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9625, LAS: 0.9277, UEM: 0.6714, LEM: 0.4459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5945, partial_loss/deprel_loss: 0.5072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7183, loss: 0.5645, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||: 93%|#########2| 88/95 [01:02<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9626, LAS: 0.9278, UEM: 0.6743, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1555, partial_loss/deprel_loss: 0.2837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.5638, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||: 97%|#########6| 92/95 [01:04<00:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9623, LAS: 0.9275, UEM: 0.6714, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5079, loss: 0.5658, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 01:43:40,329 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9546, LAS: 0.9034, UEM: 0.6531, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5055, partial_loss/deprel_loss: 7.8762, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4020, loss: 6.6940, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:06, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9639, LAS: 0.9178, UEM: 0.7926, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2003, partial_loss/deprel_loss: 5.6713, partial_loss/cycle_loss: 0.0000, batch_loss: 
4.5771, loss: 5.6320, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.10it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9541, LAS: 0.9039, UEM: 0.7210, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6134, partial_loss/deprel_loss: 7.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7700, loss: 7.5659, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9517, LAS: 0.9005, UEM: 0.6847, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2930, partial_loss/deprel_loss: 16.4667, partial_loss/cycle_loss: 0.0000, batch_loss: 13.4320, loss: 8.1682, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00, 1.13it/s]\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - reg_loss | 0.194 | 0.000\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - UEM | 0.671 | 0.685\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - LEM | 0.446 | 0.412\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EM | 0.941 | 0.879\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.177 | 1.293\n", + "2023-04-07 01:43:50,107 - 
INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | 0.952\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.349 | 16.467\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - loss | 0.566 | 8.168\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | 0.901\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:43:50,113 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:44:00,106 - INFO - combo.training.trainer - Epoch duration: 0:01:29.560242\n", + "2023-04-07 01:44:00,107 - INFO - combo.training.trainer - Estimated training time remaining: 4:47:35\n", + "2023-04-07 01:44:00,107 - INFO - allennlp.training.trainer - Epoch 151/399\n", + "2023-04-07 01:44:00,107 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:44:00,108 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:44:00,117 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9609, LAS: 0.9235, UEM: 0.7176, LEM: 0.5126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1536, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4459, loss: 0.5892, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 3%|3 | 3/95 [00:02<01:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9565, LAS: 0.9205, UEM: 0.6866, LEM: 0.4729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1358, partial_loss/deprel_loss: 0.3196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4764, loss: 0.6192, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 6%|6 | 6/95 [00:04<01:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9518, LAS: 0.9166, UEM: 0.6304, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6188, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.6535, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 11%|# | 10/95 [00:06<00:59, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9565, LAS: 0.9215, UEM: 0.6676, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.6097, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 14%|#3 | 13/95 [00:09<01:02, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9595, LAS: 0.9243, UEM: 0.6698, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3932, partial_loss/deprel_loss: 0.3966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.5908, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 18%|#7 | 17/95 [00:12<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9597, LAS: 0.9247, UEM: 0.6644, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6641, partial_loss/deprel_loss: 0.4789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7095, loss: 0.5852, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 22%|##2 | 21/95 [00:14<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9596, LAS: 0.9243, UEM: 0.6369, LEM: 0.3989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4559, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.5890, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||: 26%|##6 | 25/95 [00:17<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9590, LAS: 0.9236, UEM: 0.6199, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3745, partial_loss/deprel_loss: 0.3930, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 0.5937, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 29%|##9 | 28/95 [00:19<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9586, LAS: 0.9238, UEM: 0.6553, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6416, partial_loss/deprel_loss: 0.4670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6955, loss: 0.5927, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 33%|###2 | 31/95 [00:22<00:47, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9587, LAS: 0.9240, UEM: 0.6528, LEM: 0.4421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3300, partial_loss/deprel_loss: 0.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5537, loss: 0.5907, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 36%|###5 | 34/95 [00:24<00:44, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9604, LAS: 0.9261, UEM: 0.6791, LEM: 0.4685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0871, partial_loss/deprel_loss: 0.2256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3914, loss: 0.5778, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 39%|###8 | 37/95 [00:26<00:43, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9611, LAS: 0.9269, UEM: 0.6815, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2208, partial_loss/deprel_loss: 0.2999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4777, loss: 0.5705, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 42%|####2 | 40/95 [00:28<00:41, 1.32it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9615, LAS: 0.9275, UEM: 0.6845, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2482, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.5650, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 45%|####5 | 43/95 [00:31<00:39, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9613, LAS: 0.9272, UEM: 0.6755, LEM: 0.4621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6375, loss: 0.5672, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 48%|####8 | 46/95 [00:33<00:36, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9618, LAS: 0.9277, UEM: 0.6789, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1184, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.5634, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||: 52%|#####1 | 49/95 [00:35<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9611, LAS: 0.9270, UEM: 0.6670, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3595, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.5680, batch_reg_loss: 0.1935, reg_loss: 0.1935 ||: 56%|#####5 | 53/95 [00:37<00:28, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9618, LAS: 0.9271, UEM: 0.6702, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.5663, batch_reg_loss: 0.1935, reg_loss: 0.1935 ||: 60%|###### | 57/95 [00:40<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9626, LAS: 0.9279, UEM: 0.6817, LEM: 0.4618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1669, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.5599, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 64%|######4 | 61/95 [00:43<00:23, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9627, LAS: 0.9279, UEM: 0.6785, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4057, partial_loss/deprel_loss: 0.3609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.5593, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 67%|######7 | 64/95 [00:45<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9617, LAS: 0.9270, UEM: 0.6698, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.4235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.5659, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 72%|#######1 | 68/95 [00:47<00:18, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9620, LAS: 0.9274, UEM: 0.6724, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4837, partial_loss/deprel_loss: 0.4864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.5645, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 75%|#######4 | 71/95 [00:49<00:16, 1.45it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9623, LAS: 0.9278, UEM: 0.6786, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0840, partial_loss/deprel_loss: 0.1542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3335, loss: 0.5623, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 79%|#######8 | 75/95 [00:52<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9620, LAS: 0.9274, UEM: 0.6722, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.4788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.5649, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 82%|########2 | 78/95 [00:54<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9621, LAS: 0.9276, UEM: 0.6706, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2036, partial_loss/deprel_loss: 0.3381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.5636, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 86%|########6 | 82/95 [00:57<00:08, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9627, LAS: 0.9281, UEM: 0.6791, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1542, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4650, loss: 0.5601, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 91%|######### | 86/95 [00:59<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9629, LAS: 0.9283, UEM: 0.6831, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3320, partial_loss/deprel_loss: 0.4114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5889, loss: 0.5585, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||: 94%|#########3| 89/95 [01:02<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9621, LAS: 0.9273, UEM: 0.6730, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7520, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7576, loss: 0.5648, batch_reg_loss: 0.1933, reg_loss: 0.1935 ||: 98%|#########7| 93/95 [01:04<00:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9617, LAS: 0.9269, UEM: 0.6690, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4188, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6760, loss: 0.5690, batch_reg_loss: 0.1933, reg_loss: 0.1935 ||: 100%|##########| 95/95 [01:05<00:00, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:45:08,431 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - reg_loss | 0.193 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UEM | 0.669 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - LEM | 0.449 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EM | 0.919 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.419 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.499 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - loss | 0.569 | N/A\n", + "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:08,437 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:45:13,292 - INFO - combo.training.trainer - Epoch duration: 0:01:13.185240\n", + "2023-04-07 01:45:13,293 - INFO - combo.training.trainer - Estimated training time remaining: 4:46:32\n", + "2023-04-07 01:45:13,293 - INFO - allennlp.training.trainer - Epoch 152/399\n", + "2023-04-07 01:45:13,293 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:45:13,294 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:45:13,303 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9648, LAS: 0.9306, UEM: 0.6706, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2947, partial_loss/deprel_loss: 0.3594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5398, loss: 0.5604, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 5%|5 | 5/95 [00:02<00:42, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9627, LAS: 0.9267, UEM: 0.6190, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5120, loss: 0.5719, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 11%|# | 10/95 [00:04<00:40, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9643, LAS: 0.9288, UEM: 0.7303, LEM: 0.5263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3319, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5923, loss: 0.5558, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 15%|#4 | 14/95 [00:06<00:39, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9645, LAS: 0.9296, UEM: 0.7163, LEM: 0.5095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3716, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5503, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 19%|#8 | 18/95 [00:09<00:39, 1.96it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9622, LAS: 0.9271, UEM: 0.6931, LEM: 0.4872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6067, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7263, loss: 0.5661, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 22%|##2 | 21/95 [00:11<00:43, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9607, LAS: 0.9260, UEM: 0.6901, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.2290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.5708, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 25%|##5 | 24/95 [00:13<00:44, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9553, UAS: 0.9600, LAS: 0.9256, UEM: 0.6950, LEM: 0.4992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0893, partial_loss/deprel_loss: 0.1721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.5732, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 29%|##9 | 28/95 [00:16<00:42, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9614, LAS: 0.9271, UEM: 0.7062, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2809, partial_loss/deprel_loss: 0.3315, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.5640, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 33%|###2 | 31/95 [00:18<00:43, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9608, LAS: 0.9264, UEM: 0.6887, LEM: 0.4898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5052, partial_loss/deprel_loss: 0.4907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6869, loss: 0.5703, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 36%|###5 | 34/95 [00:20<00:41, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9273, UEM: 0.6921, LEM: 0.4883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3621, partial_loss/deprel_loss: 0.3911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.5651, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||: 39%|###8 | 37/95 [00:22<00:39, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9620, LAS: 0.9275, UEM: 0.6851, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4416, partial_loss/deprel_loss: 0.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6666, loss: 0.5657, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 43%|####3 | 41/95 [00:24<00:34, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9630, LAS: 0.9288, UEM: 0.6947, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1287, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4019, loss: 0.5575, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 47%|####7 | 45/95 [00:27<00:33, 1.50it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9638, LAS: 0.9297, UEM: 0.7002, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.2813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4458, loss: 0.5526, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 51%|##### | 48/95 [00:30<00:33, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9637, LAS: 0.9294, UEM: 0.6944, LEM: 0.4783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4207, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6260, loss: 0.5551, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 54%|#####3 | 51/95 [00:32<00:30, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9633, LAS: 0.9287, UEM: 0.6831, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.5592, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 58%|#####7 | 55/95 [00:34<00:26, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9632, LAS: 0.9287, UEM: 0.6790, LEM: 0.4609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3341, partial_loss/deprel_loss: 0.4006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5805, loss: 0.5607, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 62%|######2 | 59/95 [00:37<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9622, LAS: 0.9275, UEM: 0.6744, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1663, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.5681, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 66%|######6 | 63/95 [00:40<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9627, LAS: 0.9281, UEM: 0.6756, LEM: 0.4548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2209, partial_loss/deprel_loss: 0.3555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.5650, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 71%|####### | 67/95 [00:42<00:18, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9632, LAS: 0.9286, UEM: 0.6861, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0724, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3649, loss: 0.5610, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||: 75%|#######4 | 71/95 [00:45<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9633, LAS: 0.9287, UEM: 0.6829, LEM: 0.4647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0953, partial_loss/deprel_loss: 0.2526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4142, loss: 0.5609, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 79%|#######8 | 75/95 [00:48<00:13, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9632, LAS: 0.9287, UEM: 0.6810, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3365, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5611, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 82%|########2 | 78/95 [00:50<00:12, 
1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9635, LAS: 0.9291, UEM: 0.6777, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2915, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5593, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 86%|########6 | 82/95 [00:53<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9630, LAS: 0.9285, UEM: 0.6734, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2280, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.5626, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 89%|########9 | 85/95 [00:55<00:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9631, LAS: 0.9287, UEM: 0.6759, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4389, loss: 0.5614, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 93%|#########2| 88/95 [00:57<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9633, LAS: 0.9287, UEM: 0.6769, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.5614, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 97%|#########6| 92/95 [00:59<00:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9630, LAS: 0.9284, UEM: 0.6751, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5550, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.5642, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 100%|##########| 95/95 [01:01<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9630, LAS: 0.9284, UEM: 0.6751, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5550, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.5642, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 100%|##########| 95/95 [01:01<00:00, 1.53it/s]\n", + "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer - reg_loss | 0.193 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UEM | 0.675 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - LEM | 0.453 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EM | 0.907 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.555 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + 
"2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.550 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - loss | 0.564 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:18,484 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:46:23,248 - INFO - combo.training.trainer - Epoch duration: 0:01:09.955236\n", + "2023-04-07 01:46:23,249 - INFO - combo.training.trainer - Estimated training time remaining: 4:45:23\n", + "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - Epoch 153/399\n", + "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:46:23,258 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9771, LAS: 0.9493, UEM: 0.8953, LEM: 0.7781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.4343, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||: 3%|3 | 3/95 [00:02<01:22, 1.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9711, LAS: 0.9399, UEM: 0.8135, LEM: 0.6574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4392, loss: 0.4993, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||: 6%|6 | 6/95 [00:04<01:15, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9663, LAS: 0.9337, UEM: 0.7370, LEM: 0.5718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2946, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.5429, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||: 9%|9 | 9/95 
[00:07<01:10, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9677, LAS: 0.9344, UEM: 0.7167, LEM: 0.5239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2023, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5343, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||: 14%|#3 | 13/95 [00:09<01:02, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9664, LAS: 0.9334, UEM: 0.6901, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4230, partial_loss/deprel_loss: 0.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6081, loss: 0.5385, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||: 17%|#6 | 16/95 [00:11<00:58, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9642, LAS: 0.9310, UEM: 0.6634, LEM: 0.4599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1400, partial_loss/deprel_loss: 0.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4171, loss: 0.5492, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||: 22%|##2 | 21/95 [00:13<00:48, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9628, LAS: 0.9295, UEM: 0.6412, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5040, partial_loss/deprel_loss: 0.4501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.5579, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||: 27%|##7 | 26/95 [00:16<00:40, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9631, LAS: 0.9300, UEM: 0.6525, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5518, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 33%|###2 | 31/95 [00:18<00:34, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9615, LAS: 0.9284, UEM: 0.6319, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4570, partial_loss/deprel_loss: 0.4195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6200, loss: 0.5611, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 37%|###6 | 35/95 [00:20<00:33, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9614, LAS: 0.9283, UEM: 0.6278, LEM: 0.4211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1774, partial_loss/deprel_loss: 0.3100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4765, loss: 0.5609, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 41%|####1 | 39/95 [00:23<00:32, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9606, LAS: 0.9271, UEM: 0.6268, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5077, partial_loss/deprel_loss: 0.4792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.5675, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 45%|####5 | 43/95 [00:26<00:33, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9603, LAS: 0.9268, UEM: 0.6262, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1813, partial_loss/deprel_loss: 0.2470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5698, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 49%|####9 | 47/95 [00:29<00:32, 1.50it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9617, LAS: 0.9280, UEM: 0.6514, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1773, partial_loss/deprel_loss: 0.3006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4689, loss: 0.5614, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 54%|#####3 | 51/95 [00:32<00:31, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9622, LAS: 0.9285, UEM: 0.6540, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.5598, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 58%|#####7 | 55/95 [00:35<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9628, LAS: 0.9291, UEM: 0.6585, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4259, loss: 0.5565, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||: 61%|######1 | 58/95 [00:37<00:26, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9635, LAS: 0.9298, UEM: 0.6767, LEM: 0.4580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0988, partial_loss/deprel_loss: 0.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5503, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 64%|######4 | 61/95 [00:39<00:25, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9638, LAS: 0.9301, UEM: 0.6752, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2344, partial_loss/deprel_loss: 0.3192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4952, loss: 0.5482, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 67%|######7 | 64/95 [00:42<00:22, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9635, LAS: 0.9300, UEM: 0.6734, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.5022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7306, loss: 0.5498, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 71%|####### | 67/95 [00:44<00:20, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9638, LAS: 0.9303, UEM: 0.6732, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.5486, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 74%|#######3 | 70/95 [00:46<00:18, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9635, LAS: 0.9300, UEM: 0.6789, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0780, partial_loss/deprel_loss: 0.1876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3586, loss: 0.5509, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 77%|#######6 | 73/95 [00:48<00:16, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9635, LAS: 0.9299, UEM: 0.6765, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.5520, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 
81%|########1 | 77/95 [00:51<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9631, LAS: 0.9294, UEM: 0.6768, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1478, partial_loss/deprel_loss: 0.2834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.5553, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 84%|########4 | 80/95 [00:53<00:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9628, LAS: 0.9291, UEM: 0.6762, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4103, loss: 0.5563, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||: 87%|########7 | 83/95 [00:55<00:08, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9632, LAS: 0.9295, UEM: 0.6797, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3616, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.5544, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 92%|#########1| 87/95 [00:58<00:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9625, LAS: 0.9287, UEM: 0.6712, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9480, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8416, loss: 0.5597, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 96%|#########5| 91/95 [01:00<00:02, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9624, LAS: 0.9286, UEM: 0.6717, LEM: 0.4545, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.5606, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 100%|##########| 95/95 [01:03<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9624, LAS: 0.9286, UEM: 0.6717, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.5606, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 100%|##########| 95/95 [01:03<00:00, 1.49it/s]\n", + "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - reg_loss | 0.193 | N/A\n", + "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UEM | 0.672 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LEM | 0.454 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - EM | 0.911 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.595 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.483 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - loss | 0.561 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:29,983 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:47:34,665 - INFO - combo.training.trainer - Epoch duration: 0:01:11.416434\n", + "2023-04-07 01:47:34,666 - INFO - combo.training.trainer - Estimated training time remaining: 4:44:17\n", + "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - Epoch 154/399\n", + "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:47:34,675 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9608, LAS: 0.9279, UEM: 0.7436, LEM: 0.5331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5443, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 3%|3 | 3/95 [00:02<01:10, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9662, LAS: 0.9326, UEM: 0.7900, LEM: 0.6003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4828, loss: 0.5179, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 6%|6 | 6/95 [00:04<01:05, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9690, LAS: 0.9349, UEM: 0.7779, LEM: 0.5632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.5133, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 11%|# | 10/95 
[00:06<00:59, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9673, LAS: 0.9324, UEM: 0.7386, LEM: 0.5174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5392, loss: 0.5312, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 14%|#3 | 13/95 [00:08<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9652, LAS: 0.9304, UEM: 0.6980, LEM: 0.4796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4147, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6004, loss: 0.5489, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 18%|#7 | 17/95 [00:11<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9644, LAS: 0.9295, UEM: 0.6804, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.4568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6867, loss: 0.5554, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 22%|##2 | 21/95 [00:13<00:49, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9657, LAS: 0.9310, UEM: 0.7083, LEM: 0.4953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1441, partial_loss/deprel_loss: 0.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5453, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 25%|##5 | 24/95 [00:16<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9670, LAS: 0.9332, UEM: 0.7441, LEM: 0.5471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3460, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.5323, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 28%|##8 | 27/95 [00:18<00:50, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9672, LAS: 0.9335, UEM: 0.7319, LEM: 0.5283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.3813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5772, loss: 0.5337, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||: 33%|###2 | 31/95 [00:21<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9652, LAS: 0.9320, UEM: 0.7065, LEM: 0.5027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5752, loss: 0.5440, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 38%|###7 | 36/95 [00:23<00:37, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9648, LAS: 0.9312, UEM: 0.6991, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.5251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7397, loss: 0.5485, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 43%|####3 | 41/95 [00:26<00:31, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9652, LAS: 0.9317, UEM: 0.6909, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3004, partial_loss/deprel_loss: 0.3089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.5428, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 48%|####8 | 46/95 [00:28<00:26, 1.83it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9654, LAS: 0.9319, UEM: 0.6949, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1893, partial_loss/deprel_loss: 0.3457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.5413, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 54%|#####3 | 51/95 [00:30<00:23, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8626, UAS: 0.9645, LAS: 0.9307, UEM: 0.6942, LEM: 0.4826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0792, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9278, loss: 0.5480, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 58%|#####7 | 55/95 [00:33<00:22, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9643, LAS: 0.9303, UEM: 0.6942, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1887, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5500, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||: 62%|######2 | 59/95 [00:36<00:22, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9348, UAS: 0.9645, LAS: 0.9304, UEM: 0.6892, LEM: 0.4732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5398, loss: 0.5500, batch_reg_loss: 0.1927, reg_loss: 0.1927 ||: 66%|######6 | 63/95 [00:38<00:19, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9643, LAS: 0.9301, UEM: 0.6898, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.1419, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4562, loss: 0.5522, batch_reg_loss: 0.1927, reg_loss: 0.1927 ||: 71%|####### | 67/95 [00:41<00:18, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9643, LAS: 0.9300, UEM: 0.6867, LEM: 0.4705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5519, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 75%|#######4 | 71/95 [00:44<00:16, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9632, LAS: 0.9289, UEM: 0.6760, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.4756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 0.5604, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 79%|#######8 | 75/95 [00:47<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9629, LAS: 0.9287, UEM: 0.6774, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7689, partial_loss/deprel_loss: 0.5712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8034, loss: 0.5623, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 82%|########2 | 78/95 [00:49<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9284, UEM: 0.6756, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.3204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5640, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 85%|########5 | 81/95 [00:51<00:10, 1.38it/s]\n" + ] + }, + { + 
"name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9622, LAS: 0.9280, UEM: 0.6737, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4916, loss: 0.5692, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 88%|########8 | 84/95 [00:53<00:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9624, LAS: 0.9282, UEM: 0.6741, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6484, partial_loss/deprel_loss: 0.4866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.5675, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 93%|#########2| 88/95 [00:56<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9625, LAS: 0.9283, UEM: 0.6744, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3919, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6571, loss: 0.5661, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 96%|#########5| 91/95 [00:58<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9627, LAS: 0.9284, UEM: 0.6749, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1751, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5655, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 99%|#########8| 94/95 [01:00<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9626, LAS: 0.9282, UEM: 0.6726, LEM: 0.4536, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5320, partial_loss/deprel_loss: 0.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.5662, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 01:48:39,035 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - reg_loss | 0.193 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UEM | 0.673 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - LEM | 0.454 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EM | 0.909 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.532 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.420 | N/A\n", + "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - loss | 0.566 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | N/A\n", + 
"2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:48:39,042 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:48:43,859 - INFO - combo.training.trainer - Epoch duration: 0:01:09.193646\n", + "2023-04-07 01:48:43,860 - INFO - combo.training.trainer - Estimated training time remaining: 4:43:08\n", + "2023-04-07 01:48:43,860 - INFO - allennlp.training.trainer - Epoch 155/399\n", + "2023-04-07 01:48:43,860 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:48:43,861 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:48:43,870 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9608, LAS: 0.9276, UEM: 0.6483, LEM: 0.4555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.5914, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 3%|3 | 3/95 [00:02<01:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9570, LAS: 0.9259, UEM: 0.5925, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5579, partial_loss/deprel_loss: 0.4107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6328, loss: 0.6037, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 6%|6 | 6/95 [00:04<01:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9636, LAS: 0.9320, UEM: 0.6805, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1039, partial_loss/deprel_loss: 0.2436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5590, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 9%|9 | 9/95 [00:06<01:04, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9625, LAS: 0.9313, UEM: 0.6726, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2871, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5166, loss: 0.5573, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 13%|#2 | 12/95 [00:08<01:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9631, LAS: 0.9307, UEM: 0.6691, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6312, partial_loss/deprel_loss: 0.4830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7052, loss: 0.5559, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 17%|#6 | 16/95 [00:11<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9641, LAS: 0.9316, UEM: 0.6668, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 0.3047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4812, loss: 0.5485, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 21%|##1 | 20/95 [00:14<00:53, 1.40it/s]\n" + ] + }, + { + "name": "stdout", 
+ "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9643, LAS: 0.9317, UEM: 0.6792, LEM: 0.4498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0868, partial_loss/deprel_loss: 0.2085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3767, loss: 0.5462, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||: 24%|##4 | 23/95 [00:16<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9637, LAS: 0.9306, UEM: 0.6644, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6151, loss: 0.5520, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 27%|##7 | 26/95 [00:18<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9629, LAS: 0.9300, UEM: 0.6600, LEM: 0.4311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1871, partial_loss/deprel_loss: 0.2694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4455, loss: 0.5526, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 31%|### | 29/95 [00:21<00:48, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9623, LAS: 0.9295, UEM: 0.6463, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.3682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.5559, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 34%|###3 | 32/95 [00:23<00:45, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9624, LAS: 0.9296, UEM: 0.6430, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.5559, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 37%|###6 | 35/95 [00:25<00:43, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9633, LAS: 0.9307, UEM: 0.6570, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2356, partial_loss/deprel_loss: 0.2285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4224, loss: 0.5459, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 40%|#### | 38/95 [00:27<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9634, LAS: 0.9309, UEM: 0.6660, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6523, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.5447, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 43%|####3 | 41/95 [00:29<00:40, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9628, LAS: 0.9300, UEM: 0.6541, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4980, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6833, loss: 0.5498, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||: 47%|####7 | 45/95 [00:32<00:35, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9621, LAS: 0.9292, UEM: 0.6542, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1845, partial_loss/deprel_loss: 0.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.5548, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||: 51%|##### | 48/95 [00:34<00:33, 1.40it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9628, LAS: 0.9295, UEM: 0.6600, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2775, partial_loss/deprel_loss: 0.4158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5806, loss: 0.5522, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||: 54%|#####3 | 51/95 [00:36<00:31, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9618, LAS: 0.9283, UEM: 0.6547, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4740, partial_loss/deprel_loss: 0.4610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6561, loss: 0.5598, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||: 58%|#####7 | 55/95 [00:38<00:26, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9617, LAS: 0.9282, UEM: 0.6626, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8209, partial_loss/deprel_loss: 0.5248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7765, loss: 0.5588, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||: 62%|######2 | 59/95 [00:41<00:22, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9619, LAS: 0.9282, UEM: 0.6584, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1698, partial_loss/deprel_loss: 0.2726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4445, loss: 0.5606, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 66%|######6 | 63/95 [00:43<00:19, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9624, LAS: 0.9287, UEM: 0.6644, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2067, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4279, loss: 0.5565, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 71%|####### | 67/95 [00:45<00:16, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9623, LAS: 0.9285, UEM: 0.6710, LEM: 0.4432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1447, partial_loss/deprel_loss: 0.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5571, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 75%|#######4 | 71/95 [00:48<00:15, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9626, LAS: 0.9289, UEM: 0.6697, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2112, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4712, loss: 0.5544, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 79%|#######8 | 75/95 [00:51<00:13, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9631, LAS: 0.9293, UEM: 0.6757, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1953, partial_loss/deprel_loss: 0.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.5512, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 83%|########3 | 79/95 [00:53<00:09, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9625, LAS: 0.9286, UEM: 0.6716, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2198, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4642, loss: 0.5562, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 87%|########7 | 83/95 [00:55<00:07, 
1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9624, LAS: 0.9285, UEM: 0.6668, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5571, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 93%|#########2| 88/95 [00:57<00:03, 1.82it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9621, LAS: 0.9281, UEM: 0.6598, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5084, partial_loss/deprel_loss: 0.4923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.5596, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 97%|#########6| 92/95 [01:00<00:01, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9622, LAS: 0.9282, UEM: 0.6700, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6357, partial_loss/deprel_loss: 0.5351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.5587, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 01:49:49,763 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9701, LAS: 0.9299, UEM: 0.8368, LEM: 0.6131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3931, partial_loss/deprel_loss: 6.0986, partial_loss/cycle_loss: 0.0000, batch_loss: 4.9575, loss: 4.9463, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.09it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9506, LAS: 0.9037, UEM: 0.7416, LEM: 0.5267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6095, partial_loss/deprel_loss: 18.9605, partial_loss/cycle_loss: 0.0000, batch_loss: 15.4903, loss: 8.5861, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 45%|####5 | 5/11 [00:04<00:05, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9530, LAS: 0.9025, UEM: 0.7042, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4562, partial_loss/deprel_loss: 7.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1145, loss: 7.8166, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:07<00:02, 1.08it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9512, LAS: 0.9002, UEM: 0.6878, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 5.5646, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4954, loss: 7.7988, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9512, LAS: 0.9002, UEM: 0.6878, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 5.5646, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4954, loss: 7.7988, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.04it/s]\n", + "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:50:00,314 - INFO - 
combo.training.tensorboard_writer - reg_loss | 0.192 | 0.000\n", + "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - UEM | 0.670 | 0.688\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LEM | 0.446 | 0.421\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - EM | 0.902 | 0.935\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.636 | 0.218\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | 0.951\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.535 | 5.565\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - loss | 0.559 | 7.799\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | 0.900\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
0.000\n", + "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:50:00,320 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:50:04,527 - INFO - combo.training.trainer - Epoch duration: 0:01:20.667316\n", + "2023-04-07 01:50:04,528 - INFO - combo.training.trainer - Estimated training time remaining: 4:42:16\n", + "2023-04-07 01:50:04,528 - INFO - allennlp.training.trainer - Epoch 156/399\n", + "2023-04-07 01:50:04,528 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:50:04,529 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:50:04,538 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9720, LAS: 0.9388, UEM: 0.7689, LEM: 0.5378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1274, partial_loss/deprel_loss: 0.2506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4183, loss: 0.4725, batch_reg_loss: 0.1924, reg_loss: 0.1924 ||: 3%|3 | 3/95 [00:02<01:18, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9635, LAS: 0.9312, UEM: 0.6470, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4703, loss: 0.5486, batch_reg_loss: 0.1923, reg_loss: 0.1924 ||: 7%|7 | 7/95 [00:04<01:07, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9643, LAS: 0.9318, UEM: 0.6621, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3464, 
partial_loss/deprel_loss: 0.3820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.5366, batch_reg_loss: 0.1923, reg_loss: 0.1924 ||: 11%|# | 10/95 [00:06<01:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9637, LAS: 0.9310, UEM: 0.6443, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2167, partial_loss/deprel_loss: 0.3162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5449, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 14%|#3 | 13/95 [00:09<01:00, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9632, LAS: 0.9304, UEM: 0.6377, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5822, loss: 0.5523, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 17%|#6 | 16/95 [00:11<00:59, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9620, LAS: 0.9297, UEM: 0.6260, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2540, partial_loss/deprel_loss: 0.2591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4504, loss: 0.5535, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 20%|## | 19/95 [00:13<00:55, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9637, LAS: 0.9310, UEM: 0.6589, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1565, partial_loss/deprel_loss: 0.3142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4749, loss: 0.5424, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 23%|##3 | 22/95 [00:15<00:53, 
1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9598, LAS: 0.9271, UEM: 0.6327, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9984, partial_loss/deprel_loss: 0.6266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8933, loss: 0.5673, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 26%|##6 | 25/95 [00:17<00:51, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9616, LAS: 0.9289, UEM: 0.6562, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1413, partial_loss/deprel_loss: 0.2387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.5540, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 31%|### | 29/95 [00:20<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9615, LAS: 0.9287, UEM: 0.6530, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3790, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.5562, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 34%|###3 | 32/95 [00:22<00:45, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9615, LAS: 0.9284, UEM: 0.6475, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5956, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.5583, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 38%|###7 | 36/95 [00:25<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9623, LAS: 0.9290, UEM: 0.6547, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1599, partial_loss/deprel_loss: 0.3209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.5537, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||: 42%|####2 | 40/95 [00:27<00:37, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9627, LAS: 0.9291, UEM: 0.6520, LEM: 0.4224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3807, partial_loss/deprel_loss: 0.4060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.5514, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 46%|####6 | 44/95 [00:30<00:34, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9626, LAS: 0.9287, UEM: 0.6578, LEM: 0.4270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1378, partial_loss/deprel_loss: 0.2436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5531, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 49%|####9 | 47/95 [00:32<00:33, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9626, LAS: 0.9287, UEM: 0.6575, LEM: 0.4248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4665, loss: 0.5530, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 53%|#####2 | 50/95 [00:34<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9630, LAS: 0.9291, UEM: 0.6669, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3566, loss: 0.5501, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 56%|#####5 | 53/95 [00:37<00:29, 1.41it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9635, LAS: 0.9296, UEM: 0.6707, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5104, loss: 0.5468, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 59%|#####8 | 56/95 [00:39<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9641, LAS: 0.9303, UEM: 0.6868, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2544, partial_loss/deprel_loss: 0.3112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4921, loss: 0.5414, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 62%|######2 | 59/95 [00:41<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9644, LAS: 0.9305, UEM: 0.6866, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1881, partial_loss/deprel_loss: 0.2736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.5393, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 65%|######5 | 62/95 [00:43<00:23, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9648, LAS: 0.9310, UEM: 0.6928, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5651, loss: 0.5360, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||: 68%|######8 | 65/95 [00:46<00:22, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9635, LAS: 0.9296, UEM: 0.6842, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8027, partial_loss/deprel_loss: 0.5600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.5462, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||: 73%|#######2 | 69/95 [00:48<00:18, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9636, LAS: 0.9297, UEM: 0.6881, LEM: 0.4622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5464, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||: 77%|#######6 | 73/95 [00:50<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9764, UAS: 0.9636, LAS: 0.9300, UEM: 0.6977, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0214, partial_loss/deprel_loss: 0.0955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2728, loss: 0.5453, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||: 81%|########1 | 77/95 [00:52<00:11, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9624, LAS: 0.9288, UEM: 0.6878, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3479, partial_loss/deprel_loss: 0.4048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.5535, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 85%|########5 | 81/95 [00:55<00:08, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9623, LAS: 0.9287, UEM: 0.6844, LEM: 0.4670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3306, partial_loss/deprel_loss: 0.4380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6087, loss: 0.5546, batch_reg_loss: 
0.1921, reg_loss: 0.1922 ||: 91%|######### | 86/95 [00:57<00:04, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9617, LAS: 0.9279, UEM: 0.6748, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4644, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6213, loss: 0.5612, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 96%|#########5| 91/95 [00:59<00:02, 1.88it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9616, LAS: 0.9277, UEM: 0.6721, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5621, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:02<00:00, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9616, LAS: 0.9277, UEM: 0.6721, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5621, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:02<00:00, 1.51it/s]\n", + "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - reg_loss | 0.192 | N/A\n", + "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UEM | 0.672 | N/A\n", + 
"2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LEM | 0.452 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - EM | 0.935 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.222 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.336 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - loss | 0.562 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:51:10,733 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:51:15,513 - INFO - combo.training.trainer - Epoch duration: 0:01:10.985362\n", + "2023-04-07 01:51:15,514 - INFO - combo.training.trainer - Estimated training time remaining: 4:41:09\n", + "2023-04-07 01:51:15,514 - INFO - allennlp.training.trainer - Epoch 157/399\n", + "2023-04-07 01:51:15,514 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:51:15,515 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:51:15,526 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9344, UAS: 0.9738, LAS: 0.9382, UEM: 0.7844, LEM: 0.5275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5026, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 4%|4 | 4/95 [00:02<00:58, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9582, LAS: 0.9227, UEM: 0.6872, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2120, partial_loss/deprel_loss: 0.6602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9627, loss: 0.5984, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 8%|8 | 8/95 [00:05<00:56, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9627, LAS: 0.9272, UEM: 0.7279, LEM: 0.4885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.3992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.5602, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 13%|#2 | 12/95 [00:07<00:54, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9634, LAS: 0.9286, UEM: 0.7222, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.2052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3923, loss: 0.5488, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 16%|#5 | 15/95 [00:10<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9613, LAS: 0.9273, UEM: 0.6857, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.3671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5572, loss: 0.5681, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 20%|## | 19/95 [00:12<00:50, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9617, LAS: 0.9278, UEM: 0.6919, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4330, loss: 0.5624, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 24%|##4 | 23/95 [00:15<00:47, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9630, LAS: 0.9291, UEM: 0.7137, LEM: 0.4966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1964, partial_loss/deprel_loss: 0.2525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.5527, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 27%|##7 | 26/95 [00:17<00:47, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9634, LAS: 0.9295, UEM: 0.7100, LEM: 0.4893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1755, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4447, loss: 0.5503, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 31%|### | 29/95 [00:19<00:46, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9638, LAS: 0.9299, UEM: 0.7098, LEM: 0.4877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.3517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.5488, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||: 34%|###3 | 32/95 [00:22<00:45, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9628, LAS: 0.9285, UEM: 0.6919, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5739, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7344, loss: 0.5599, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 38%|###7 | 36/95 [00:24<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9634, LAS: 0.9293, UEM: 0.7012, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.5536, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 41%|####1 | 39/95 [00:26<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9629, LAS: 0.9287, UEM: 0.6886, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3934, partial_loss/deprel_loss: 0.4782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6533, loss: 0.5574, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 45%|####5 | 43/95 [00:29<00:36, 1.44it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9615, LAS: 0.9273, UEM: 0.6715, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.3812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.5673, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 49%|####9 | 47/95 [00:31<00:32, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9616, LAS: 0.9273, UEM: 0.6700, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5664, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 53%|#####2 | 50/95 [00:33<00:30, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9618, LAS: 0.9275, UEM: 0.6755, LEM: 0.4539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1519, partial_loss/deprel_loss: 0.2576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4284, loss: 0.5625, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 56%|#####5 | 53/95 [00:36<00:29, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9614, LAS: 0.9269, UEM: 0.6713, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9562, partial_loss/deprel_loss: 0.5576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.5657, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 59%|#####8 | 56/95 [00:38<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9609, LAS: 0.9267, UEM: 0.6684, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2975, partial_loss/deprel_loss: 0.2845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4790, loss: 0.5669, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||: 62%|######2 | 59/95 [00:40<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9610, LAS: 0.9268, UEM: 0.6650, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3575, partial_loss/deprel_loss: 0.4162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5666, batch_reg_loss: 0.1920, reg_loss: 0.1920 ||: 66%|######6 | 63/95 [00:42<00:21, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9614, LAS: 0.9274, UEM: 0.6638, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.5629, batch_reg_loss: 0.1920, reg_loss: 0.1920 ||: 71%|####### | 67/95 [00:45<00:18, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9615, LAS: 0.9277, UEM: 0.6603, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.4155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6292, loss: 0.5623, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 75%|#######4 | 71/95 [00:48<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9614, LAS: 0.9276, UEM: 0.6570, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5893, partial_loss/deprel_loss: 0.4940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7050, loss: 0.5624, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 78%|#######7 | 74/95 [00:50<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9616, LAS: 0.9279, UEM: 0.6575, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5763, partial_loss/deprel_loss: 0.4984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.5618, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 81%|########1 | 77/95 [00:52<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9619, LAS: 0.9281, UEM: 0.6649, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0667, partial_loss/deprel_loss: 0.2107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3739, loss: 0.5604, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 84%|########4 | 80/95 [00:55<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9623, LAS: 0.9286, UEM: 0.6652, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.3376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5161, loss: 0.5585, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 88%|########8 | 84/95 [00:57<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9626, LAS: 0.9291, UEM: 0.6767, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3567, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6076, loss: 0.5566, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 92%|#########1| 87/95 [01:00<00:06, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9621, LAS: 0.9284, UEM: 0.6697, LEM: 0.4488, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8095, partial_loss/deprel_loss: 0.5292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7772, loss: 0.5611, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 96%|#########5| 91/95 [01:02<00:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9624, LAS: 0.9285, UEM: 0.6747, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1141, partial_loss/deprel_loss: 0.2310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3995, loss: 0.5591, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 100%|##########| 95/95 [01:04<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9624, LAS: 0.9285, UEM: 0.6747, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1141, partial_loss/deprel_loss: 0.2310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3995, loss: 0.5591, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 100%|##########| 95/95 [01:04<00:00, 1.46it/s]\n", + "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - reg_loss | 0.192 | N/A\n", + "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UEM | 0.675 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - LEM | 0.453 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - EM | 0.947 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.114 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.231 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - loss | 0.559 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:24,165 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:52:30,974 - INFO - combo.training.trainer - Epoch duration: 0:01:15.460015\n", + "2023-04-07 01:52:30,975 - INFO - combo.training.trainer - Estimated training time remaining: 4:40:09\n", + "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - Epoch 158/399\n", + "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:52:30,983 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9512, LAS: 0.9167, UEM: 0.4082, LEM: 0.1803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4347, partial_loss/deprel_loss: 0.3830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5852, loss: 0.6455, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 3%|3 | 3/95 [00:02<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9581, LAS: 0.9261, UEM: 0.5239, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4925, loss: 0.5920, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 6%|6 | 6/95 [00:04<01:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9609, LAS: 0.9278, UEM: 0.5954, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4652, loss: 0.5821, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 9%|9 | 9/95 [00:06<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9646, LAS: 0.9328, UEM: 0.7253, LEM: 0.5343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2249, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.5446, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 12%|#1 | 11/95 [00:08<01:07, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9666, LAS: 0.9345, UEM: 0.7312, LEM: 0.5271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.2457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4217, loss: 0.5319, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 15%|#4 | 14/95 [00:10<01:03, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9677, LAS: 0.9352, UEM: 0.7371, LEM: 0.5285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5060, loss: 0.5235, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||: 18%|#7 | 17/95 [00:13<01:00, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9656, LAS: 0.9328, UEM: 0.7227, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4180, loss: 0.5381, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||: 21%|##1 | 20/95 [00:15<00:56, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9658, LAS: 0.9335, UEM: 0.7145, LEM: 0.5046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2215, partial_loss/deprel_loss: 0.2695, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.5310, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||: 25%|##5 | 24/95 [00:17<00:50, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9668, LAS: 0.9342, UEM: 0.7202, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4783, loss: 0.5258, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||: 28%|##8 | 27/95 [00:19<00:49, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9669, LAS: 0.9343, UEM: 0.7249, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5693, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.5244, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||: 32%|###1 | 30/95 [00:22<00:47, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9650, LAS: 0.9322, UEM: 0.7041, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.4029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5930, loss: 0.5382, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||: 36%|###5 | 34/95 [00:24<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9654, LAS: 0.9326, UEM: 0.7031, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2435, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4975, loss: 0.5356, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||: 40%|#### | 38/95 [00:27<00:38, 1.46it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9647, LAS: 0.9321, UEM: 0.6988, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.2438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5386, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||: 44%|####4 | 42/95 [00:30<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9647, LAS: 0.9319, UEM: 0.6935, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3095, partial_loss/deprel_loss: 0.3647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5454, loss: 0.5406, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 48%|####8 | 46/95 [00:32<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9651, LAS: 0.9325, UEM: 0.7000, LEM: 0.4756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3892, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5890, loss: 0.5369, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 52%|#####1 | 49/95 [00:34<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9653, LAS: 0.9327, UEM: 0.7027, LEM: 0.4786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1235, partial_loss/deprel_loss: 0.2544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4200, loss: 0.5361, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 55%|#####4 | 52/95 [00:36<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9647, LAS: 0.9320, UEM: 0.6959, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6449, partial_loss/deprel_loss: 0.5230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.5420, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 58%|#####7 | 55/95 [00:39<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9646, LAS: 0.9317, UEM: 0.6893, LEM: 0.4628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3482, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.5438, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 61%|######1 | 58/95 [00:41<00:26, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9652, LAS: 0.9324, UEM: 0.6942, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.5389, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 65%|######5 | 62/95 [00:43<00:22, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9651, LAS: 0.9322, UEM: 0.6969, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.2259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3885, loss: 0.5402, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 68%|######8 | 65/95 [00:46<00:22, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9640, LAS: 0.9312, UEM: 0.6889, LEM: 0.4655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1801, partial_loss/deprel_loss: 0.5861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8966, loss: 0.5461, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 72%|#######1 | 68/95 [00:48<00:19, 1.37it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9641, LAS: 0.9313, UEM: 0.6869, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2721, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5535, loss: 0.5456, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 76%|#######5 | 72/95 [00:51<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9638, LAS: 0.9309, UEM: 0.6826, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1630, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4307, loss: 0.5491, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 80%|######## | 76/95 [00:53<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9636, LAS: 0.9306, UEM: 0.6749, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5320, loss: 0.5515, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||: 84%|########4 | 80/95 [00:56<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9636, LAS: 0.9306, UEM: 0.6741, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.4970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7118, loss: 0.5511, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||: 88%|########8 | 84/95 [00:59<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9636, LAS: 0.9305, UEM: 0.6716, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2457, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.5515, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||: 92%|#########1| 87/95 [01:01<00:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9638, LAS: 0.9305, UEM: 0.6772, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4094, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6009, loss: 0.5505, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||: 95%|#########4| 90/95 [01:03<00:03, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9631, LAS: 0.9297, UEM: 0.6746, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 0.5688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8107, loss: 0.5554, batch_reg_loss: 0.1916, reg_loss: 0.1917 ||: 99%|#########8| 94/95 [01:05<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9633, LAS: 0.9300, UEM: 0.6788, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0983, partial_loss/deprel_loss: 0.2248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.5537, batch_reg_loss: 0.1916, reg_loss: 0.1917 ||: 100%|##########| 95/95 [01:06<00:00, 1.43it/s]\n", + "2023-04-07 01:53:40,249 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - reg_loss | 0.192 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UEM | 0.679 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - LEM | 0.456 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EM | 0.956 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.098 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.225 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - loss | 0.554 | N/A\n", + "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - LAS | 0.930 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:42,138 - INFO - allennlp.training.checkpointer - Best 
validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:53:46,737 - INFO - combo.training.trainer - Epoch duration: 0:01:15.762648\n", + "2023-04-07 01:53:46,738 - INFO - combo.training.trainer - Estimated training time remaining: 4:39:09\n", + "2023-04-07 01:53:46,738 - INFO - allennlp.training.trainer - Epoch 159/399\n", + "2023-04-07 01:53:46,738 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:53:46,739 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:53:46,748 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9558, LAS: 0.9254, UEM: 0.4000, LEM: 0.1876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2381, partial_loss/deprel_loss: 0.3095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.5982, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 5%|5 | 5/95 [00:02<00:42, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9604, LAS: 0.9288, UEM: 0.5916, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0738, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3887, loss: 0.5749, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 11%|# | 10/95 [00:04<00:40, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9642, LAS: 0.9318, UEM: 0.6435, LEM: 0.4006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5529, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 14%|#3 | 13/95 [00:07<00:48, 1.70it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9672, LAS: 0.9347, UEM: 0.7097, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1916, partial_loss/deprel_loss: 0.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4223, loss: 0.5279, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 17%|#6 | 16/95 [00:09<00:51, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9663, LAS: 0.9337, UEM: 0.6978, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 0.3682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.5315, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 20%|## | 19/95 [00:12<00:52, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9658, LAS: 0.9327, UEM: 0.6779, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3998, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6204, loss: 0.5353, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 23%|##3 | 22/95 [00:14<00:51, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9652, LAS: 0.9323, UEM: 0.6699, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.4153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6083, loss: 0.5388, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 26%|##6 | 25/95 [00:16<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9638, LAS: 0.9309, UEM: 0.6480, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, 
partial_loss/deprel_loss: 0.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.5503, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||: 31%|### | 29/95 [00:19<00:46, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9647, LAS: 0.9317, UEM: 0.6596, LEM: 0.4328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4591, partial_loss/deprel_loss: 0.4312, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6283, loss: 0.5452, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 35%|###4 | 33/95 [00:21<00:41, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9648, LAS: 0.9318, UEM: 0.6602, LEM: 0.4320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1464, partial_loss/deprel_loss: 0.2929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4551, loss: 0.5421, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 38%|###7 | 36/95 [00:23<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9636, LAS: 0.9308, UEM: 0.6529, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2751, partial_loss/deprel_loss: 0.3254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.5493, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 41%|####1 | 39/95 [00:26<00:39, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9634, LAS: 0.9305, UEM: 0.6588, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1040, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3889, loss: 0.5507, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 44%|####4 | 42/95 
[00:28<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9628, LAS: 0.9299, UEM: 0.6538, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1895, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4600, loss: 0.5544, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 48%|####8 | 46/95 [00:30<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9632, LAS: 0.9302, UEM: 0.6575, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6014, loss: 0.5526, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 52%|#####1 | 49/95 [00:32<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9627, LAS: 0.9296, UEM: 0.6498, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5661, loss: 0.5555, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 56%|#####5 | 53/95 [00:35<00:27, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9629, LAS: 0.9298, UEM: 0.6488, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3685, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.5553, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||: 60%|###### | 57/95 [00:37<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9625, LAS: 0.9291, UEM: 0.6473, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 0.4626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6712, loss: 0.5580, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||: 64%|######4 | 61/95 [00:40<00:22, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9630, LAS: 0.9297, UEM: 0.6631, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1971, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4820, loss: 0.5543, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||: 68%|######8 | 65/95 [00:43<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9626, LAS: 0.9294, UEM: 0.6562, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4976, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5910, loss: 0.5566, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||: 72%|#######1 | 68/95 [00:46<00:19, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9630, LAS: 0.9297, UEM: 0.6571, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5550, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 76%|#######5 | 72/95 [00:48<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9630, LAS: 0.9298, UEM: 0.6630, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6367, partial_loss/deprel_loss: 0.5429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.5549, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 79%|#######8 | 75/95 
[00:50<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9631, LAS: 0.9299, UEM: 0.6651, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2904, partial_loss/deprel_loss: 0.3650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5415, loss: 0.5535, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 82%|########2 | 78/95 [00:53<00:12, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9626, LAS: 0.9293, UEM: 0.6625, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.5566, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 85%|########5 | 81/95 [00:55<00:10, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9624, LAS: 0.9290, UEM: 0.6622, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3186, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5987, loss: 0.5579, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 89%|########9 | 85/95 [00:57<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9626, LAS: 0.9290, UEM: 0.6635, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5313, loss: 0.5574, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 93%|#########2| 88/95 [00:59<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9624, LAS: 0.9288, UEM: 0.6653, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9281, partial_loss/deprel_loss: 0.5648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8289, loss: 0.5582, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 96%|#########5| 91/95 [01:02<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9624, LAS: 0.9289, UEM: 0.6723, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0274, partial_loss/deprel_loss: 0.1028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2791, loss: 0.5586, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 100%|##########| 95/95 [01:05<00:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9624, LAS: 0.9289, UEM: 0.6723, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0274, partial_loss/deprel_loss: 0.1028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2791, loss: 0.5586, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 100%|##########| 95/95 [01:05<00:00, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:54:54,853 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:54:54,853 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - reg_loss | 0.192 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UEM | 0.672 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - LEM | 0.452 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EM | 0.973 | N/A\n", + "2023-04-07 
01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.027 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.103 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - loss | 0.559 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:54:54,859 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:54:58,881 - INFO - combo.training.trainer - Epoch duration: 0:01:12.142955\n", + "2023-04-07 01:54:58,882 - INFO - combo.training.trainer - Estimated training time remaining: 4:38:04\n", + "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - Epoch 160/399\n", + "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:54:58,890 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9763, LAS: 0.9455, UEM: 0.8416, LEM: 0.6602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4727, loss: 0.4444, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||: 3%|3 | 3/95 [00:02<01:15, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9635, LAS: 0.9305, UEM: 0.7475, LEM: 0.5457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6281, partial_loss/deprel_loss: 0.4631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6875, loss: 0.5448, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||: 7%|7 | 7/95 [00:04<01:06, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9628, LAS: 0.9300, UEM: 0.6904, LEM: 0.4797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3590, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5794, loss: 0.5437, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||: 13%|#2 | 12/95 [00:07<00:55, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9651, LAS: 0.9323, UEM: 0.7082, LEM: 0.4906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3948, loss: 0.5286, batch_reg_loss: 0.1913, reg_loss: 0.1914 ||: 18%|#7 | 17/95 [00:09<00:47, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9348, UAS: 0.9658, LAS: 0.9333, UEM: 0.7009, LEM: 0.4815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.5212, batch_reg_loss: 0.1913, reg_loss: 0.1914 ||: 23%|##3 | 22/95 [00:11<00:41, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9545, UAS: 0.9651, LAS: 0.9327, UEM: 0.6852, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1269, partial_loss/deprel_loss: 0.2500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4167, loss: 0.5297, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||: 28%|##8 | 27/95 [00:14<00:37, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9650, LAS: 0.9327, UEM: 0.6704, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3497, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5316, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||: 33%|###2 | 31/95 [00:17<00:37, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9657, LAS: 0.9333, UEM: 0.6804, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1903, partial_loss/deprel_loss: 0.3031, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4718, loss: 0.5281, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||: 37%|###6 | 35/95 [00:20<00:38, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9650, LAS: 0.9328, UEM: 0.6808, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1476, partial_loss/deprel_loss: 0.2481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5313, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||: 41%|####1 | 39/95 [00:23<00:37, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9647, LAS: 0.9325, UEM: 0.6787, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.4110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.5324, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||: 44%|####4 | 42/95 [00:25<00:37, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9642, LAS: 0.9318, UEM: 0.6684, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.3724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.5373, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 48%|####8 | 46/95 [00:28<00:34, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9640, LAS: 0.9315, UEM: 0.6639, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1647, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4413, loss: 0.5395, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 52%|#####1 | 49/95 [00:30<00:32, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9648, LAS: 0.9324, UEM: 0.6768, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2503, partial_loss/deprel_loss: 0.3267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.5331, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 55%|#####4 | 52/95 [00:32<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9651, LAS: 0.9327, UEM: 0.6788, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4462, partial_loss/deprel_loss: 0.3923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5943, loss: 0.5310, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 59%|#####8 | 56/95 [00:34<00:26, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9646, LAS: 0.9321, UEM: 0.6794, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4600, partial_loss/deprel_loss: 0.4477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.5378, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 63%|######3 | 60/95 [00:37<00:23, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9507, UAS: 0.9639, LAS: 0.9315, UEM: 0.6732, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2364, partial_loss/deprel_loss: 0.2890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.5420, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 68%|######8 | 65/95 [00:40<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9639, LAS: 0.9315, UEM: 0.6766, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.4290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.5426, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 73%|#######2 | 69/95 [00:43<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9642, LAS: 0.9316, UEM: 0.6796, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2187, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5059, loss: 0.5414, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 77%|#######6 | 73/95 [00:46<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9633, LAS: 0.9308, UEM: 0.6734, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4063, partial_loss/deprel_loss: 0.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6109, loss: 0.5485, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 80%|######## | 76/95 [00:48<00:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9632, LAS: 0.9307, UEM: 0.6718, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.3529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5237, loss: 0.5496, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 83%|########3 | 79/95 [00:50<00:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9627, LAS: 0.9302, UEM: 0.6643, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3886, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5686, loss: 0.5549, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 86%|########6 | 82/95 [00:52<00:09, 
1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9631, LAS: 0.9304, UEM: 0.6688, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.3865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.5524, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||: 91%|######### | 86/95 [00:55<00:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9768, UAS: 0.9637, LAS: 0.9313, UEM: 0.6856, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.0992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2755, loss: 0.5481, batch_reg_loss: 0.1911, reg_loss: 0.1913 ||: 94%|#########3| 89/95 [00:57<00:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9638, LAS: 0.9313, UEM: 0.6840, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3355, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5469, batch_reg_loss: 0.1911, reg_loss: 0.1912 ||: 98%|#########7| 93/95 [01:00<00:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9636, LAS: 0.9310, UEM: 0.6800, LEM: 0.4631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6199, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6722, loss: 0.5485, batch_reg_loss: 0.1911, reg_loss: 0.1912 ||: 100%|##########| 95/95 [01:01<00:00, 1.54it/s]\n", + "2023-04-07 01:56:03,562 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9437, UAS: 0.9694, LAS: 0.9243, UEM: 0.8308, LEM: 0.5652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1994, partial_loss/deprel_loss: 4.8253, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9001, loss: 5.2767, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:07, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9577, LAS: 0.9093, UEM: 0.7087, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0427, partial_loss/deprel_loss: 8.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9872, loss: 6.0390, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:05<00:04, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9586, LAS: 0.9096, UEM: 0.7243, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0864, partial_loss/deprel_loss: 13.6287, partial_loss/cycle_loss: 0.0000, batch_loss: 11.1203, loss: 6.2996, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 82%|########1 | 9/11 [00:08<00:01, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9520, LAS: 0.9019, UEM: 0.6842, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5402, partial_loss/deprel_loss: 18.2763, partial_loss/cycle_loss: 0.0000, batch_loss: 14.9291, loss: 7.6460, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9520, LAS: 0.9019, UEM: 0.6842, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5402, partial_loss/deprel_loss: 18.2763, partial_loss/cycle_loss: 
0.0000, batch_loss: 14.9291, loss: 7.6460, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00, 1.02it/s]\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - reg_loss | 0.191 | 0.000\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UEM | 0.680 | 0.684\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - LEM | 0.463 | 0.409\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EM | 0.905 | 0.859\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.620 | 1.540\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UAS | 0.964 | 0.952\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.446 | 18.276\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - loss | 0.549 | 7.646\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | 0.902\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 
01:56:14,329 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:14,334 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:56:21,425 - INFO - combo.training.trainer - Epoch duration: 0:01:22.543137\n", + "2023-04-07 01:56:21,426 - INFO - combo.training.trainer - Estimated training time remaining: 4:37:13\n", + "2023-04-07 01:56:21,426 - INFO - allennlp.training.trainer - Epoch 161/399\n", + "2023-04-07 01:56:21,426 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:56:21,427 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:56:21,437 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9555, LAS: 0.9184, UEM: 0.5959, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.6300, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 3%|3 | 3/95 [00:02<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9557, LAS: 0.9243, UEM: 0.5085, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, 
partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5787, loss: 0.5879, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 7%|7 | 7/95 [00:04<00:58, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9628, LAS: 0.9307, UEM: 0.6356, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4656, loss: 0.5359, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 13%|#2 | 12/95 [00:07<00:52, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9621, LAS: 0.9294, UEM: 0.6676, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0854, partial_loss/deprel_loss: 0.2194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3837, loss: 0.5444, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 17%|#6 | 16/95 [00:09<00:48, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9627, LAS: 0.9303, UEM: 0.6596, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5670, loss: 0.5401, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 21%|##1 | 20/95 [00:11<00:45, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9648, LAS: 0.9327, UEM: 0.6894, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1833, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.5236, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 25%|##5 | 24/95 [00:14<00:42, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9639, LAS: 0.9313, UEM: 0.6683, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.3911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5682, loss: 0.5348, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||: 29%|##9 | 28/95 [00:16<00:41, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9643, LAS: 0.9318, UEM: 0.6854, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7576, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7267, loss: 0.5320, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 34%|###3 | 32/95 [00:19<00:38, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9627, LAS: 0.9301, UEM: 0.6603, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3612, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.5463, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 39%|###8 | 37/95 [00:21<00:32, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9624, LAS: 0.9297, UEM: 0.6565, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1974, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4524, loss: 0.5493, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 44%|####4 | 42/95 [00:23<00:27, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9625, LAS: 0.9298, UEM: 0.6596, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2212, partial_loss/deprel_loss: 0.3290, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.5477, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 48%|####8 | 46/95 [00:26<00:28, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9631, LAS: 0.9304, UEM: 0.6641, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5449, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 53%|#####2 | 50/95 [00:29<00:27, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9642, LAS: 0.9315, UEM: 0.6857, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.2576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4230, loss: 0.5365, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 57%|#####6 | 54/95 [00:32<00:26, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9639, LAS: 0.9311, UEM: 0.6912, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5797, partial_loss/deprel_loss: 0.4343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6543, loss: 0.5392, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||: 61%|######1 | 58/95 [00:34<00:24, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9639, LAS: 0.9308, UEM: 0.6910, LEM: 0.4648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2046, partial_loss/deprel_loss: 0.3376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.5417, batch_reg_loss: 0.1910, reg_loss: 0.1910 ||: 65%|######5 | 62/95 [00:37<00:21, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9455, UAS: 0.9638, LAS: 0.9310, UEM: 0.7006, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.2678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4575, loss: 0.5400, batch_reg_loss: 0.1910, reg_loss: 0.1910 ||: 69%|######9 | 66/95 [00:40<00:20, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9639, LAS: 0.9311, UEM: 0.7003, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1505, partial_loss/deprel_loss: 0.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4464, loss: 0.5398, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 73%|#######2 | 69/95 [00:42<00:18, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9637, LAS: 0.9308, UEM: 0.6971, LEM: 0.4801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4598, loss: 0.5418, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 76%|#######5 | 72/95 [00:45<00:16, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9636, LAS: 0.9308, UEM: 0.6915, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5565, partial_loss/deprel_loss: 0.4021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.5427, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 79%|#######8 | 75/95 [00:47<00:14, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9626, LAS: 0.9298, UEM: 0.6839, LEM: 0.4676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 0.5497, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 82%|########2 | 78/95 [00:49<00:12, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9625, LAS: 0.9297, UEM: 0.6848, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3127, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.5505, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 85%|########5 | 81/95 [00:51<00:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9625, LAS: 0.9297, UEM: 0.6827, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3948, partial_loss/deprel_loss: 0.3623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.5507, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 88%|########8 | 84/95 [00:53<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9624, LAS: 0.9294, UEM: 0.6783, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2434, partial_loss/deprel_loss: 0.3092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.5525, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 92%|#########1| 87/95 [00:55<00:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9622, LAS: 0.9292, UEM: 0.6732, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6044, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6656, loss: 0.5544, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 95%|#########4| 90/95 [00:57<00:03, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9625, LAS: 0.9295, UEM: 0.6752, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4919, loss: 0.5530, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 98%|#########7| 93/95 [00:59<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9624, LAS: 0.9294, UEM: 0.6733, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4885, partial_loss/deprel_loss: 0.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.5530, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 100%|##########| 95/95 [01:01<00:00, 1.55it/s]\n", + "2023-04-07 01:57:25,711 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:57:25,711 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - reg_loss | 0.191 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UEM | 0.673 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LEM | 0.456 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EM | 0.912 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.488 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + 
"2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.433 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - loss | 0.553 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:57:25,713 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:57:25,713 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:57:25,717 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:57:30,571 - INFO - combo.training.trainer - Epoch duration: 0:01:09.144809\n", + "2023-04-07 01:57:30,571 - INFO - combo.training.trainer - Estimated training time remaining: 4:36:03\n", + "2023-04-07 01:57:30,571 - INFO - allennlp.training.trainer - Epoch 162/399\n", + "2023-04-07 01:57:30,572 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:57:30,572 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:57:30,581 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9612, LAS: 0.9282, UEM: 0.6256, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2923, partial_loss/deprel_loss: 0.2939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4845, loss: 0.5527, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 3%|3 | 3/95 [00:02<01:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9637, LAS: 0.9303, UEM: 0.6470, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.3002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4834, loss: 0.5343, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 6%|6 | 6/95 [00:04<01:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9655, LAS: 0.9322, UEM: 0.6758, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1586, partial_loss/deprel_loss: 0.2265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4038, loss: 0.5210, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 9%|9 | 9/95 [00:06<01:01, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": 
"stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9663, LAS: 0.9335, UEM: 0.6827, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.4342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6432, loss: 0.5187, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 14%|#3 | 13/95 [00:09<00:57, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9649, LAS: 0.9321, UEM: 0.6541, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5915, partial_loss/deprel_loss: 0.4867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6985, loss: 0.5344, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 17%|#6 | 16/95 [00:11<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9638, LAS: 0.9311, UEM: 0.6333, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6412, partial_loss/deprel_loss: 0.4716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.5446, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 20%|## | 19/95 [00:13<00:53, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9652, LAS: 0.9328, UEM: 0.6613, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.5312, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||: 23%|##3 | 22/95 [00:15<00:55, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9649, LAS: 0.9326, UEM: 0.6584, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4952, partial_loss/deprel_loss: 0.4124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5325, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||: 26%|##6 | 25/95 [00:17<00:51, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9648, LAS: 0.9324, UEM: 0.6507, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5078, partial_loss/deprel_loss: 0.4754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6727, loss: 0.5364, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||: 31%|### | 29/95 [00:20<00:46, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9663, LAS: 0.9335, UEM: 0.6773, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5272, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||: 35%|###4 | 33/95 [00:23<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9653, LAS: 0.9324, UEM: 0.6630, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5060, partial_loss/deprel_loss: 0.4764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6731, loss: 0.5343, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||: 38%|###7 | 36/95 [00:25<00:41, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9654, LAS: 0.9324, UEM: 0.6623, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4791, loss: 0.5342, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||: 41%|####1 | 39/95 [00:27<00:39, 1.41it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9639, LAS: 0.9307, UEM: 0.6514, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4177, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5691, loss: 0.5440, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||: 45%|####5 | 43/95 [00:29<00:34, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9629, LAS: 0.9299, UEM: 0.6561, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1249, partial_loss/deprel_loss: 0.2237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3947, loss: 0.5477, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||: 51%|##### | 48/95 [00:32<00:28, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9627, LAS: 0.9296, UEM: 0.6457, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3377, partial_loss/deprel_loss: 0.3512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5393, loss: 0.5492, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||: 56%|#####5 | 53/95 [00:34<00:23, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9619, LAS: 0.9288, UEM: 0.6347, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3078, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5566, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||: 61%|######1 | 58/95 [00:36<00:19, 1.93it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9724, UAS: 0.9630, LAS: 0.9303, UEM: 0.6753, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.0364, partial_loss/deprel_loss: 0.1030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2805, loss: 0.5460, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||: 66%|######6 | 63/95 [00:39<00:16, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9636, LAS: 0.9310, UEM: 0.6836, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2450, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 0.5414, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 72%|#######1 | 68/95 [00:41<00:13, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9630, LAS: 0.9301, UEM: 0.6758, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3095, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.5470, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 77%|#######6 | 73/95 [00:43<00:10, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9631, LAS: 0.9303, UEM: 0.6746, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1627, partial_loss/deprel_loss: 0.3092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.5461, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 82%|########2 | 78/95 [00:45<00:07, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9633, LAS: 0.9303, UEM: 0.6780, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0843, partial_loss/deprel_loss: 0.2144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3791, loss: 0.5461, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 87%|########7 | 83/95 [00:47<00:05, 2.19it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9631, LAS: 0.9300, UEM: 0.6730, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4936, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.5479, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 93%|#########2| 88/95 [00:50<00:03, 2.15it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9630, LAS: 0.9299, UEM: 0.6716, LEM: 0.4537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4188, loss: 0.5476, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 98%|#########7| 93/95 [00:52<00:00, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9631, LAS: 0.9301, UEM: 0.6724, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3475, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.5462, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 100%|##########| 95/95 [00:53<00:00, 1.77it/s]\n", + "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - reg_loss | 0.191 | N/A\n", + "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UEM | 0.672 | N/A\n", + "2023-04-07 
01:58:26,961 - INFO - combo.training.tensorboard_writer - LEM | 0.454 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.347 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.391 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - loss | 0.546 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - LAS | 0.930 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:58:26,962 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:58:26,962 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:58:26,966 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:58:34,185 - INFO - combo.training.trainer - Epoch duration: 0:01:03.613676\n", + "2023-04-07 01:58:34,186 - INFO - combo.training.trainer - Estimated training time remaining: 4:34:45\n", + "2023-04-07 01:58:34,186 - INFO - allennlp.training.trainer - Epoch 163/399\n", + "2023-04-07 01:58:34,186 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:58:34,187 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:58:34,197 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9738, LAS: 0.9427, UEM: 0.7407, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.3351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.4713, batch_reg_loss: 0.1907, reg_loss: 0.1907 ||: 5%|5 | 5/95 [00:02<00:43, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9726, LAS: 0.9422, UEM: 0.7833, LEM: 0.5907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.3165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.4745, batch_reg_loss: 0.1906, reg_loss: 0.1907 ||: 9%|9 | 9/95 [00:04<00:41, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9705, LAS: 0.9395, UEM: 0.7353, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3920, partial_loss/deprel_loss: 0.3697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.4920, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||: 15%|#4 | 14/95 [00:06<00:38, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9726, LAS: 0.9415, UEM: 0.7816, LEM: 0.5827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2579, partial_loss/deprel_loss: 0.3561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5270, loss: 0.4757, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||: 19%|#8 | 18/95 [00:08<00:37, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9678, LAS: 0.9356, UEM: 0.7379, LEM: 0.5402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.3727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5532, loss: 0.5152, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||: 24%|##4 | 23/95 [00:11<00:34, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9665, LAS: 0.9344, UEM: 0.7124, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2866, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.5233, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||: 29%|##9 | 28/95 [00:13<00:31, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9660, LAS: 0.9340, UEM: 0.7136, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0685, partial_loss/deprel_loss: 0.1542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3276, loss: 0.5238, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||: 35%|###4 | 33/95 [00:15<00:29, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9666, LAS: 0.9346, UEM: 0.7175, LEM: 0.5170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1808, partial_loss/deprel_loss: 0.2531, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4292, loss: 0.5215, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 39%|###8 | 37/95 [00:17<00:28, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9651, LAS: 0.9329, UEM: 0.7028, LEM: 0.5034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5526, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 0.5335, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 44%|####4 | 42/95 [00:20<00:26, 2.02it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9636, LAS: 0.9312, UEM: 0.6875, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7577, partial_loss/deprel_loss: 0.6006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8225, loss: 0.5440, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 49%|####9 | 47/95 [00:22<00:23, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9623, LAS: 0.9297, UEM: 0.6766, LEM: 0.4765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.5541, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 55%|#####4 | 52/95 [00:25<00:21, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9624, LAS: 0.9298, UEM: 0.6881, LEM: 0.4863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1182, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5534, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 60%|###### | 57/95 [00:27<00:18, 2.00it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9624, LAS: 0.9296, UEM: 0.6822, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.5547, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 65%|######5 | 62/95 [00:30<00:16, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9635, LAS: 0.9306, UEM: 0.6920, LEM: 0.4800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1464, partial_loss/deprel_loss: 0.2588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4269, loss: 0.5480, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 71%|####### | 67/95 [00:32<00:13, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9633, LAS: 0.9302, UEM: 0.6827, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4574, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6042, loss: 0.5511, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 76%|#######5 | 72/95 [00:34<00:10, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9631, LAS: 0.9301, UEM: 0.6784, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4201, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6041, loss: 0.5508, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 81%|########1 | 77/95 [00:37<00:08, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9632, LAS: 0.9301, UEM: 0.6764, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4449, loss: 0.5505, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||: 86%|########6 | 82/95 [00:39<00:06, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9633, LAS: 0.9301, UEM: 0.6720, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2312, partial_loss/deprel_loss: 0.3471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5502, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||: 92%|#########1| 87/95 [00:41<00:03, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9632, LAS: 0.9301, UEM: 0.6725, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5510, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||: 97%|#########6| 92/95 [00:44<00:01, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9636, LAS: 0.9305, UEM: 0.6769, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0981, partial_loss/deprel_loss: 0.2375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, loss: 0.5482, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||: 100%|##########| 95/95 [00:45<00:00, 2.09it/s]\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - reg_loss | 0.191 | N/A\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:59:22,894 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - UEM | 0.677 | N/A\n", + "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - LEM | 0.460 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - EM | 0.953 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.098 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - UAS | 0.964 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.238 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - loss | 0.548 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - LAS | 0.930 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:59:22,902 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 01:59:27,729 - INFO - combo.training.trainer - Epoch duration: 0:00:53.542821\n", + "2023-04-07 01:59:27,729 - INFO - combo.training.trainer - Estimated training time remaining: 4:33:12\n", + "2023-04-07 01:59:27,729 - INFO - allennlp.training.trainer - Epoch 164/399\n", + "2023-04-07 01:59:27,730 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 01:59:27,730 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:59:27,740 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9619, LAS: 0.9298, UEM: 0.5734, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5451, partial_loss/deprel_loss: 0.4259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6402, loss: 0.5597, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 5%|5 | 5/95 [00:02<00:44, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9635, LAS: 0.9322, UEM: 0.5934, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5574, partial_loss/deprel_loss: 0.3986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6208, loss: 0.5415, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 11%|# | 10/95 [00:04<00:40, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9623, LAS: 0.9315, UEM: 0.5744, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6257, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6951, loss: 0.5491, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 16%|#5 | 15/95 
[00:06<00:37, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9658, LAS: 0.9341, UEM: 0.6419, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1404, partial_loss/deprel_loss: 0.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4234, loss: 0.5297, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 21%|##1 | 20/95 [00:09<00:35, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9634, LAS: 0.9315, UEM: 0.6415, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4832, loss: 0.5432, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 26%|##6 | 25/95 [00:11<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9616, LAS: 0.9299, UEM: 0.6162, LEM: 0.3831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.5513, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 32%|###1 | 30/95 [00:13<00:29, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9616, LAS: 0.9295, UEM: 0.6095, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5807, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.5535, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 37%|###6 | 35/95 [00:15<00:26, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9611, LAS: 0.9289, UEM: 0.6072, LEM: 0.3795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1790, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4357, loss: 0.5548, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||: 42%|####2 | 40/95 [00:18<00:25, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9623, LAS: 0.9302, UEM: 0.6283, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.3416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5459, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 47%|####7 | 45/95 [00:20<00:23, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9616, LAS: 0.9293, UEM: 0.6202, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2663, partial_loss/deprel_loss: 0.3061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.5515, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 53%|#####2 | 50/95 [00:22<00:20, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9611, LAS: 0.9288, UEM: 0.6350, LEM: 0.4137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1256, partial_loss/deprel_loss: 0.2711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4323, loss: 0.5548, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 58%|#####7 | 55/95 [00:25<00:19, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9617, LAS: 0.9293, UEM: 0.6479, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.5513, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 63%|######3 | 60/95 [00:28<00:17, 2.06it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9625, LAS: 0.9300, UEM: 0.6559, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.3304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.5457, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 68%|######8 | 65/95 [00:30<00:14, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9632, LAS: 0.9307, UEM: 0.6727, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.5400, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 74%|#######3 | 70/95 [00:32<00:12, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9637, LAS: 0.9317, UEM: 0.6923, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0938, partial_loss/deprel_loss: 0.2573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.5344, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||: 79%|#######8 | 75/95 [00:35<00:09, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9638, LAS: 0.9317, UEM: 0.6925, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7460, loss: 0.5358, batch_reg_loss: 0.1902, reg_loss: 0.1904 ||: 84%|########4 | 80/95 [00:37<00:07, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9633, LAS: 0.9311, UEM: 0.6860, LEM: 0.4731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1684, partial_loss/deprel_loss: 0.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.5391, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 89%|########9 | 85/95 [00:39<00:04, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9632, LAS: 0.9308, UEM: 0.6815, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2699, partial_loss/deprel_loss: 0.3483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5229, loss: 0.5407, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 95%|#########4| 90/95 [00:42<00:02, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9631, LAS: 0.9307, UEM: 0.6746, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5432, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 100%|##########| 95/95 [00:44<00:00, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9631, LAS: 0.9307, UEM: 0.6746, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5432, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 100%|##########| 95/95 [00:44<00:00, 2.13it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - reg_loss | 0.190 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - UEM | 0.675 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - LEM | 0.459 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - EM | 0.925 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.405 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.395 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - loss | 0.543 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:00:15,295 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:00:20,102 - INFO - combo.training.trainer - Epoch duration: 0:00:52.372078\n", + "2023-04-07 02:00:20,102 - INFO - combo.training.trainer - Estimated training time remaining: 4:31:38\n", + "2023-04-07 02:00:20,102 - INFO - allennlp.training.trainer - Epoch 165/399\n", + "2023-04-07 02:00:20,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:00:20,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:00:20,113 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9573, LAS: 0.9240, UEM: 0.5156, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7770, partial_loss/deprel_loss: 0.5007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.5904, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||: 5%|5 | 5/95 [00:02<00:41, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9650, LAS: 0.9322, UEM: 0.6708, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.3998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5407, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||: 11%|# | 10/95 [00:04<00:39, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9678, LAS: 0.9353, UEM: 0.7127, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1809, partial_loss/deprel_loss: 0.2555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4308, loss: 0.5196, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||: 15%|#4 | 14/95 
[00:06<00:38, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9650, LAS: 0.9318, UEM: 0.6826, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6285, partial_loss/deprel_loss: 0.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6952, loss: 0.5403, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||: 20%|## | 19/95 [00:08<00:35, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9671, LAS: 0.9345, UEM: 0.7417, LEM: 0.5474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1539, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4421, loss: 0.5187, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||: 24%|##4 | 23/95 [00:11<00:35, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9666, LAS: 0.9343, UEM: 0.7245, LEM: 0.5267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.3402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.5220, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 29%|##9 | 28/95 [00:13<00:32, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9647, LAS: 0.9324, UEM: 0.7068, LEM: 0.5070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6443, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.5348, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 35%|###4 | 33/95 [00:15<00:29, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9652, LAS: 0.9329, UEM: 0.7001, LEM: 0.4969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2062, partial_loss/deprel_loss: 0.2855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5303, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 40%|#### | 38/95 [00:18<00:27, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9655, LAS: 0.9333, UEM: 0.7031, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1846, partial_loss/deprel_loss: 0.2773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.5274, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 45%|####5 | 43/95 [00:20<00:24, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9638, LAS: 0.9314, UEM: 0.6898, LEM: 0.4807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5657, partial_loss/deprel_loss: 0.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.5381, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 51%|##### | 48/95 [00:22<00:21, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9632, LAS: 0.9309, UEM: 0.6809, LEM: 0.4694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5652, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7000, loss: 0.5434, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||: 56%|#####5 | 53/95 [00:24<00:19, 2.21it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9642, LAS: 0.9317, UEM: 0.6983, LEM: 0.4861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0907, partial_loss/deprel_loss: 0.2074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3741, loss: 0.5356, batch_reg_loss: 0.1901, 
reg_loss: 0.1901 ||: 61%|######1 | 58/95 [00:27<00:17, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9344, UAS: 0.9641, LAS: 0.9314, UEM: 0.6879, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3749, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5394, batch_reg_loss: 0.1901, reg_loss: 0.1901 ||: 66%|######6 | 63/95 [00:29<00:14, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9640, LAS: 0.9312, UEM: 0.6810, LEM: 0.4659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4680, partial_loss/deprel_loss: 0.4725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.5400, batch_reg_loss: 0.1901, reg_loss: 0.1901 ||: 72%|#######1 | 68/95 [00:31<00:12, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9635, LAS: 0.9308, UEM: 0.6824, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2634, partial_loss/deprel_loss: 0.3195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4983, loss: 0.5429, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 77%|#######6 | 73/95 [00:34<00:10, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9633, LAS: 0.9308, UEM: 0.6798, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.4904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7235, loss: 0.5438, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 82%|########2 | 78/95 [00:36<00:08, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9637, LAS: 0.9311, UEM: 0.6769, LEM: 
0.4616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3138, partial_loss/deprel_loss: 0.3029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.5419, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 87%|########7 | 83/95 [00:39<00:05, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9642, LAS: 0.9316, UEM: 0.6870, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4966, loss: 0.5379, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 93%|#########2| 88/95 [00:41<00:03, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9635, LAS: 0.9308, UEM: 0.6806, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4357, loss: 0.5434, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 98%|#########7| 93/95 [00:44<00:00, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9633, LAS: 0.9307, UEM: 0.6768, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.3600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5702, loss: 0.5447, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 100%|##########| 95/95 [00:45<00:00, 2.10it/s]\n", + "2023-04-07 02:01:08,477 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9448, LAS: 0.8860, UEM: 0.5352, LEM: 0.1796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5433, 
partial_loss/deprel_loss: 7.2230, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8870, loss: 6.9931, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:02<00:04, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9505, LAS: 0.8974, UEM: 0.6350, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 6.9281, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6240, loss: 7.0933, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:04<00:02, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8590, UAS: 0.9515, LAS: 0.9005, UEM: 0.7005, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5050, partial_loss/deprel_loss: 16.8045, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7446, loss: 7.1973, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:06<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9514, LAS: 0.8998, UEM: 0.6857, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9330, partial_loss/deprel_loss: 9.0223, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4045, loss: 7.2161, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.47it/s] \n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - reg_loss | 0.190 | 0.000\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EUEM | 
0.000 | 0.000\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UEM | 0.677 | 0.686\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - LEM | 0.461 | 0.408\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EM | 0.929 | 0.893\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.461 | 0.933\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | 0.951\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.360 | 9.022\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - loss | 0.545 | 7.216\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | 0.900\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:01:15,996 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:01:20,786 - INFO - combo.training.trainer - Epoch duration: 0:01:00.683444\n", + "2023-04-07 02:01:20,786 - INFO - combo.training.trainer - Estimated training time remaining: 4:30:17\n", + "2023-04-07 02:01:20,786 - INFO - allennlp.training.trainer - Epoch 166/399\n", + "2023-04-07 02:01:20,787 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:01:20,787 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:01:20,797 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9630, LAS: 0.9317, UEM: 0.5782, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5015, loss: 0.5402, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||: 5%|5 | 5/95 [00:02<00:39, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9617, LAS: 0.9299, UEM: 0.5833, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6250, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.5524, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||: 11%|# | 10/95 [00:04<00:38, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9609, LAS: 0.9288, UEM: 0.6356, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1701, partial_loss/deprel_loss: 0.2190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3992, loss: 0.5518, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||: 16%|#5 | 15/95 
[00:07<00:37, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9625, LAS: 0.9310, UEM: 0.6482, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.5423, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||: 21%|##1 | 20/95 [00:09<00:35, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9658, LAS: 0.9344, UEM: 0.7192, LEM: 0.5075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1990, partial_loss/deprel_loss: 0.2955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4662, loss: 0.5199, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||: 25%|##5 | 24/95 [00:11<00:33, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9667, LAS: 0.9357, UEM: 0.7434, LEM: 0.5478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.0946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2706, loss: 0.5135, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||: 29%|##9 | 28/95 [00:13<00:32, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9642, LAS: 0.9332, UEM: 0.7205, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2251, partial_loss/deprel_loss: 0.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4872, loss: 0.5324, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||: 35%|###4 | 33/95 [00:16<00:30, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9642, LAS: 0.9329, UEM: 0.7150, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6486, loss: 0.5328, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||: 40%|#### | 38/95 [00:18<00:27, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9655, LAS: 0.9340, UEM: 0.7234, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0865, partial_loss/deprel_loss: 0.2346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3949, loss: 0.5269, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||: 45%|####5 | 43/95 [00:20<00:24, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9656, LAS: 0.9338, UEM: 0.7135, LEM: 0.5010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3880, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.5266, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||: 51%|##### | 48/95 [00:23<00:22, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9664, LAS: 0.9343, UEM: 0.7228, LEM: 0.5068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0947, partial_loss/deprel_loss: 0.2209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3855, loss: 0.5215, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||: 56%|#####5 | 53/95 [00:25<00:20, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9662, LAS: 0.9339, UEM: 0.7176, LEM: 0.5030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3663, partial_loss/deprel_loss: 0.4278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6054, loss: 0.5242, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||: 61%|######1 | 58/95 [00:27<00:17, 2.06it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9368, UAS: 0.9666, LAS: 0.9343, UEM: 0.7131, LEM: 0.4957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2723, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5230, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||: 66%|######6 | 63/95 [00:30<00:15, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9655, LAS: 0.9330, UEM: 0.7009, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3474, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.5304, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 72%|#######1 | 68/95 [00:32<00:12, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9650, LAS: 0.9325, UEM: 0.6981, LEM: 0.4813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.4150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6181, loss: 0.5332, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 77%|#######6 | 73/95 [00:35<00:10, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9649, LAS: 0.9324, UEM: 0.6913, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4917, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5346, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 82%|########2 | 78/95 [00:37<00:08, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9652, LAS: 0.9326, UEM: 0.6916, LEM: 0.4719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4802, loss: 0.5338, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 87%|########7 | 83/95 [00:39<00:05, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9649, LAS: 0.9321, UEM: 0.6894, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 0.4445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6367, loss: 0.5362, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 93%|#########2| 88/95 [00:42<00:03, 2.12it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9646, LAS: 0.9318, UEM: 0.6823, LEM: 0.4627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7761, partial_loss/deprel_loss: 0.4415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.5384, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 98%|#########7| 93/95 [00:44<00:00, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9643, LAS: 0.9315, UEM: 0.6814, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2074, partial_loss/deprel_loss: 0.2274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4132, loss: 0.5408, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 100%|##########| 95/95 [00:45<00:00, 2.10it/s]\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - reg_loss | 0.190 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - UEM | 0.681 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - LEM | 0.463 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - EM | 0.945 | N/A\n", + "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.207 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - UAS | 0.964 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.227 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - loss | 0.541 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - LAS | 0.932 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:02:09,286 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:02:14,100 - INFO - combo.training.trainer - Epoch duration: 0:00:53.313553\n", + "2023-04-07 02:02:14,100 - INFO - combo.training.trainer - Estimated training time remaining: 4:28:45\n", + "2023-04-07 02:02:14,101 - INFO - allennlp.training.trainer - Epoch 167/399\n", + "2023-04-07 02:02:14,101 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:02:14,102 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:02:14,110 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9654, LAS: 0.9332, UEM: 0.6255, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1278, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4161, loss: 0.5278, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||: 5%|5 | 5/95 [00:02<00:43, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9584, LAS: 0.9268, UEM: 0.6078, LEM: 0.3995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1507, partial_loss/deprel_loss: 0.6453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9362, loss: 0.5770, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||: 9%|9 | 9/95 [00:04<00:42, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9615, LAS: 0.9300, UEM: 0.6402, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1392, partial_loss/deprel_loss: 0.2267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3990, loss: 0.5564, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||: 14%|#3 | 13/95 
[00:06<00:40, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9644, LAS: 0.9332, UEM: 0.6783, LEM: 0.4616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2646, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4887, loss: 0.5265, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||: 19%|#8 | 18/95 [00:08<00:37, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9633, LAS: 0.9322, UEM: 0.6436, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2725, partial_loss/deprel_loss: 0.2990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.5361, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||: 24%|##4 | 23/95 [00:11<00:34, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9625, LAS: 0.9311, UEM: 0.6389, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1966, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5427, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||: 29%|##9 | 28/95 [00:13<00:32, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9623, LAS: 0.9310, UEM: 0.6383, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8791, partial_loss/deprel_loss: 0.5183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7802, loss: 0.5432, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||: 35%|###4 | 33/95 [00:16<00:29, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9624, LAS: 0.9309, UEM: 0.6327, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1652, partial_loss/deprel_loss: 0.3114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4718, loss: 0.5450, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||: 40%|#### | 38/95 [00:18<00:26, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9632, LAS: 0.9319, UEM: 0.6344, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2448, partial_loss/deprel_loss: 0.2695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4543, loss: 0.5403, batch_reg_loss: 0.1897, reg_loss: 0.1897 ||: 45%|####5 | 43/95 [00:20<00:24, 2.16it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9639, LAS: 0.9326, UEM: 0.6478, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5301, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.5358, batch_reg_loss: 0.1897, reg_loss: 0.1897 ||: 51%|##### | 48/95 [00:22<00:22, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9643, LAS: 0.9329, UEM: 0.6518, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4277, partial_loss/deprel_loss: 0.4355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6236, loss: 0.5326, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||: 56%|#####5 | 53/95 [00:25<00:19, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9645, LAS: 0.9330, UEM: 0.6463, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3142, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5341, loss: 0.5324, batch_reg_loss: 0.1896, 
reg_loss: 0.1897 ||: 61%|######1 | 58/95 [00:27<00:17, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9648, LAS: 0.9333, UEM: 0.6506, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2682, partial_loss/deprel_loss: 0.3169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.5293, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||: 66%|######6 | 63/95 [00:29<00:14, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9653, LAS: 0.9337, UEM: 0.6653, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3111, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.5264, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||: 72%|#######1 | 68/95 [00:32<00:12, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9649, LAS: 0.9334, UEM: 0.6681, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4777, loss: 0.5303, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||: 77%|#######6 | 73/95 [00:34<00:10, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9654, LAS: 0.9338, UEM: 0.6709, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.2615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4394, loss: 0.5279, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||: 82%|########2 | 78/95 [00:36<00:07, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9736, UAS: 0.9662, LAS: 0.9346, UEM: 0.6955, LEM: 
0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0278, partial_loss/deprel_loss: 0.1079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2814, loss: 0.5208, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||: 87%|########7 | 83/95 [00:39<00:06, 1.97it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9661, LAS: 0.9344, UEM: 0.6960, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.5217, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||: 92%|#########1| 87/95 [00:41<00:04, 1.98it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9657, LAS: 0.9341, UEM: 0.6945, LEM: 0.4807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1499, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4085, loss: 0.5231, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||: 97%|#########6| 92/95 [00:44<00:01, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9651, LAS: 0.9334, UEM: 0.6874, LEM: 0.4750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6916, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.5286, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||: 100%|##########| 95/95 [00:45<00:00, 2.07it/s]\n", + "2023-04-07 02:03:02,709 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - reg_loss | 0.190 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - 
EUAS | 0.000 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - UEM | 0.687 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - LEM | 0.475 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - EM | 0.908 | N/A\n", + "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.692 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - UAS | 0.965 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.474 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - loss | 0.529 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - LAS | 0.933 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:02,717 - INFO - 
allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:03:07,245 - INFO - combo.training.trainer - Epoch duration: 0:00:53.144077\n", + "2023-04-07 02:03:07,245 - INFO - combo.training.trainer - Estimated training time remaining: 4:27:14\n", + "2023-04-07 02:03:07,246 - INFO - allennlp.training.trainer - Epoch 168/399\n", + "2023-04-07 02:03:07,246 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:03:07,247 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:03:07,257 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9666, LAS: 0.9362, UEM: 0.6196, LEM: 0.3873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.2921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4755, loss: 0.5008, batch_reg_loss: 0.1895, reg_loss: 0.1895 ||: 5%|5 | 5/95 [00:02<00:38, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9671, LAS: 0.9346, UEM: 0.6740, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.4462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6664, loss: 0.5037, batch_reg_loss: 0.1895, reg_loss: 0.1895 ||: 9%|9 | 9/95 [00:04<00:39, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9649, LAS: 0.9325, UEM: 0.6628, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.3403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 
0.5212, batch_reg_loss: 0.1894, reg_loss: 0.1895 ||: 15%|#4 | 14/95 [00:06<00:36, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9664, LAS: 0.9347, UEM: 0.6997, LEM: 0.4825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4664, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6058, loss: 0.5104, batch_reg_loss: 0.1894, reg_loss: 0.1895 ||: 20%|## | 19/95 [00:08<00:34, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9641, LAS: 0.9330, UEM: 0.6694, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3107, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.5253, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||: 25%|##5 | 24/95 [00:11<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9620, LAS: 0.9311, UEM: 0.6397, LEM: 0.4237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8955, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7307, loss: 0.5400, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||: 31%|### | 29/95 [00:13<00:30, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9614, LAS: 0.9305, UEM: 0.6237, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.3106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5452, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||: 36%|###5 | 34/95 [00:15<00:27, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9617, LAS: 0.9309, UEM: 0.6249, 
LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1641, partial_loss/deprel_loss: 0.2673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.5443, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||: 41%|####1 | 39/95 [00:18<00:26, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9625, LAS: 0.9318, UEM: 0.6325, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3411, partial_loss/deprel_loss: 0.3364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5372, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||: 46%|####6 | 44/95 [00:20<00:24, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9629, LAS: 0.9323, UEM: 0.6364, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1839, partial_loss/deprel_loss: 0.2767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.5370, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||: 52%|#####1 | 49/95 [00:22<00:21, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9635, LAS: 0.9327, UEM: 0.6392, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1691, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4635, loss: 0.5335, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||: 57%|#####6 | 54/95 [00:25<00:19, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9640, LAS: 0.9330, UEM: 0.6387, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2968, partial_loss/deprel_loss: 0.3182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5032, loss: 0.5312, batch_reg_loss: 0.1893, 
reg_loss: 0.1894 ||: 62%|######2 | 59/95 [00:27<00:16, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9639, LAS: 0.9332, UEM: 0.6360, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.2927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4716, loss: 0.5308, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||: 67%|######7 | 64/95 [00:29<00:14, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9645, LAS: 0.9338, UEM: 0.6452, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1767, partial_loss/deprel_loss: 0.2089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3917, loss: 0.5265, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||: 73%|#######2 | 69/95 [00:32<00:12, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9644, LAS: 0.9336, UEM: 0.6536, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2759, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5375, loss: 0.5278, batch_reg_loss: 0.1892, reg_loss: 0.1894 ||: 78%|#######7 | 74/95 [00:34<00:10, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9649, LAS: 0.9342, UEM: 0.6632, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4438, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6031, loss: 0.5240, batch_reg_loss: 0.1892, reg_loss: 0.1894 ||: 83%|########3 | 79/95 [00:37<00:07, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9657, LAS: 0.9351, UEM: 0.6920, LEM: 
0.4787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0267, partial_loss/deprel_loss: 0.1064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2796, loss: 0.5168, batch_reg_loss: 0.1892, reg_loss: 0.1893 ||: 88%|########8 | 84/95 [00:40<00:05, 1.98it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9653, LAS: 0.9348, UEM: 0.6902, LEM: 0.4779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.2646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.5183, batch_reg_loss: 0.1892, reg_loss: 0.1893 ||: 94%|#########3| 89/95 [00:42<00:03, 1.99it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9653, LAS: 0.9347, UEM: 0.6901, LEM: 0.4773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.2738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.5187, batch_reg_loss: 0.1891, reg_loss: 0.1893 ||: 99%|#########8| 94/95 [00:45<00:00, 2.00it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9652, LAS: 0.9346, UEM: 0.6877, LEM: 0.4753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4584, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.5194, batch_reg_loss: 0.1891, reg_loss: 0.1893 ||: 100%|##########| 95/95 [00:45<00:00, 2.09it/s]\n", + "2023-04-07 02:03:55,866 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - reg_loss | 0.189 | N/A\n", + 
"2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UEM | 0.688 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - LEM | 0.475 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.458 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UAS | 0.965 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.381 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - loss | 0.519 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - LAS | 0.935 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 
N/A\n", + "2023-04-07 02:03:55,873 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:04:00,656 - INFO - combo.training.trainer - Epoch duration: 0:00:53.410501\n", + "2023-04-07 02:04:00,657 - INFO - combo.training.trainer - Estimated training time remaining: 4:25:43\n", + "2023-04-07 02:04:00,657 - INFO - allennlp.training.trainer - Epoch 169/399\n", + "2023-04-07 02:04:00,657 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:04:00,658 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:04:00,667 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9698, LAS: 0.9411, UEM: 0.6418, LEM: 0.4026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2413, partial_loss/deprel_loss: 0.2945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4730, loss: 0.4935, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||: 5%|5 | 5/95 [00:02<00:38, 2.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9726, LAS: 0.9440, UEM: 0.7260, LEM: 0.5097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2509, partial_loss/deprel_loss: 0.2617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.4653, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||: 11%|# | 10/95 [00:04<00:37, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9677, LAS: 0.9380, UEM: 0.6683, LEM: 0.4510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.3501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5695, loss: 0.4984, batch_reg_loss: 0.1891, 
reg_loss: 0.1891 ||: 16%|#5 | 15/95 [00:06<00:36, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9693, LAS: 0.9395, UEM: 0.6868, LEM: 0.4654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1516, partial_loss/deprel_loss: 0.2564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4245, loss: 0.4872, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||: 21%|##1 | 20/95 [00:09<00:34, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9687, LAS: 0.9386, UEM: 0.6907, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.2328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4929, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||: 26%|##6 | 25/95 [00:11<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9673, LAS: 0.9369, UEM: 0.6747, LEM: 0.4506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6361, partial_loss/deprel_loss: 0.4534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6790, loss: 0.5034, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||: 32%|###1 | 30/95 [00:13<00:29, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9654, LAS: 0.9351, UEM: 0.6693, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1109, partial_loss/deprel_loss: 0.2039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3743, loss: 0.5151, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||: 36%|###5 | 34/95 [00:15<00:28, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9640, LAS: 0.9335, UEM: 0.6648, LEM: 0.4455, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.5248, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||: 40%|#### | 38/95 [00:18<00:27, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9643, LAS: 0.9338, UEM: 0.6627, LEM: 0.4412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1614, partial_loss/deprel_loss: 0.2306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4058, loss: 0.5239, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||: 45%|####5 | 43/95 [00:20<00:24, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9639, LAS: 0.9334, UEM: 0.6678, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4158, partial_loss/deprel_loss: 0.3459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5489, loss: 0.5280, batch_reg_loss: 0.1890, reg_loss: 0.1890 ||: 51%|##### | 48/95 [00:22<00:23, 2.04it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9648, LAS: 0.9342, UEM: 0.6731, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1368, partial_loss/deprel_loss: 0.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4226, loss: 0.5226, batch_reg_loss: 0.1890, reg_loss: 0.1890 ||: 56%|#####5 | 53/95 [00:25<00:19, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9652, LAS: 0.9346, UEM: 0.6799, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, 
loss: 0.5194, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||: 61%|######1 | 58/95 [00:27<00:17, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9662, LAS: 0.9354, UEM: 0.6912, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1551, partial_loss/deprel_loss: 0.2573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.5132, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||: 66%|######6 | 63/95 [00:29<00:15, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9664, LAS: 0.9359, UEM: 0.7032, LEM: 0.4875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1846, partial_loss/deprel_loss: 0.2637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.5111, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||: 72%|#######1 | 68/95 [00:32<00:13, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9659, LAS: 0.9357, UEM: 0.6989, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1499, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.5120, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||: 77%|#######6 | 73/95 [00:35<00:10, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9665, LAS: 0.9364, UEM: 0.7073, LEM: 0.4957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.2823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.5077, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||: 82%|########2 | 78/95 [00:37<00:08, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 
0.9665, LAS: 0.9363, UEM: 0.7041, LEM: 0.4912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.3876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5988, loss: 0.5086, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||: 87%|########7 | 83/95 [00:39<00:05, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9661, LAS: 0.9360, UEM: 0.6966, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5800, partial_loss/deprel_loss: 0.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6172, loss: 0.5121, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||: 93%|#########2| 88/95 [00:42<00:03, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9664, LAS: 0.9362, UEM: 0.6986, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.5113, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||: 98%|#########7| 93/95 [00:44<00:00, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9663, LAS: 0.9362, UEM: 0.6948, LEM: 0.4785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3264, partial_loss/deprel_loss: 0.3409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.5126, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||: 100%|##########| 95/95 [00:45<00:00, 2.09it/s]\n", + "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer - reg_loss | 0.189 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UEM | 0.695 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LEM | 0.479 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - EM | 0.942 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.326 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UAS | 0.966 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.341 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - loss | 0.513 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LAS | 0.936 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:04:48,874 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:04:52,934 - INFO - combo.training.trainer - Epoch duration: 0:00:52.276559\n", + "2023-04-07 02:04:52,934 - INFO - combo.training.trainer - Estimated training time remaining: 4:24:12\n", + "2023-04-07 02:04:52,934 - INFO - allennlp.training.trainer - Epoch 170/399\n", + "2023-04-07 02:04:52,934 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:04:52,935 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:04:52,943 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9684, LAS: 0.9376, UEM: 0.6909, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4841, partial_loss/deprel_loss: 0.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6174, loss: 0.5100, batch_reg_loss: 0.1888, reg_loss: 0.1888 ||: 5%|5 | 5/95 [00:02<00:39, 2.29it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9687, LAS: 0.9387, UEM: 0.6775, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.2755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4521, loss: 0.4978, batch_reg_loss: 0.1888, reg_loss: 0.1888 ||: 11%|# | 10/95 [00:04<00:36, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9715, LAS: 0.9419, UEM: 0.7333, LEM: 0.5131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1959, partial_loss/deprel_loss: 0.2153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, 
loss: 0.4725, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||: 16%|#5 | 15/95 [00:06<00:34, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9721, LAS: 0.9428, UEM: 0.7274, LEM: 0.5008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.4681, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||: 21%|##1 | 20/95 [00:08<00:32, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9698, LAS: 0.9406, UEM: 0.7019, LEM: 0.4749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.2651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.4841, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||: 26%|##6 | 25/95 [00:10<00:30, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9662, LAS: 0.9372, UEM: 0.6700, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6342, partial_loss/deprel_loss: 0.4175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.5039, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||: 32%|###1 | 30/95 [00:13<00:28, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9666, LAS: 0.9376, UEM: 0.6813, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1756, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4631, loss: 0.5028, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||: 37%|###6 | 35/95 [00:15<00:27, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9670, LAS: 0.9382, UEM: 
0.6947, LEM: 0.4845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4920, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5534, loss: 0.4973, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||: 42%|####2 | 40/95 [00:17<00:24, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9678, LAS: 0.9391, UEM: 0.7201, LEM: 0.5218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6697, loss: 0.4923, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||: 47%|####7 | 45/95 [00:20<00:23, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9673, LAS: 0.9385, UEM: 0.7101, LEM: 0.5084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4554, partial_loss/deprel_loss: 0.3643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 0.4978, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||: 53%|#####2 | 50/95 [00:22<00:21, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9675, LAS: 0.9387, UEM: 0.7079, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0977, partial_loss/deprel_loss: 0.2086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3750, loss: 0.4944, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||: 58%|#####7 | 55/95 [00:25<00:19, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9660, LAS: 0.9371, UEM: 0.6921, LEM: 0.4913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0203, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7783, loss: 0.5049, batch_reg_loss: 0.1886, 
reg_loss: 0.1887 ||: 63%|######3 | 60/95 [00:27<00:16, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9658, LAS: 0.9369, UEM: 0.6886, LEM: 0.4873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5424, partial_loss/deprel_loss: 0.4279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.5069, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||: 68%|######8 | 65/95 [00:30<00:14, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9658, LAS: 0.9368, UEM: 0.6917, LEM: 0.4884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1012, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3896, loss: 0.5079, batch_reg_loss: 0.1885, reg_loss: 0.1887 ||: 74%|#######3 | 70/95 [00:32<00:12, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9659, LAS: 0.9369, UEM: 0.6901, LEM: 0.4871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3690, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.5082, batch_reg_loss: 0.1885, reg_loss: 0.1887 ||: 78%|#######7 | 74/95 [00:34<00:10, 1.99it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9661, LAS: 0.9371, UEM: 0.6906, LEM: 0.4851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4746, loss: 0.5066, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 83%|########3 | 79/95 [00:37<00:08, 1.99it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9666, LAS: 0.9375, UEM: 0.6934, LEM: 
0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1515, partial_loss/deprel_loss: 0.2274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4007, loss: 0.5043, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 88%|########8 | 84/95 [00:39<00:05, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9668, LAS: 0.9376, UEM: 0.6980, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3548, partial_loss/deprel_loss: 0.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.5031, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 94%|#########3| 89/95 [00:42<00:02, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9665, LAS: 0.9373, UEM: 0.6975, LEM: 0.4906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5044, loss: 0.5043, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 99%|#########8| 94/95 [00:44<00:00, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9665, LAS: 0.9373, UEM: 0.6966, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5168, loss: 0.5045, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 100%|##########| 95/95 [00:45<00:00, 2.11it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:05:41,112 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9606, LAS: 0.9147, UEM: 0.8017, LEM: 0.5895, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2081, partial_loss/deprel_loss: 4.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7889, loss: 6.6149, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9545, LAS: 0.9051, UEM: 0.7521, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5775, partial_loss/deprel_loss: 16.9584, partial_loss/cycle_loss: 0.0000, batch_loss: 13.8822, loss: 7.3829, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 55%|#####4 | 6/11 [00:04<00:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9544, LAS: 0.9039, UEM: 0.7156, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2515, partial_loss/deprel_loss: 14.2445, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6459, loss: 7.2721, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 91%|######### | 10/11 [00:06<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9524, LAS: 0.9017, UEM: 0.6955, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0646, partial_loss/deprel_loss: 8.0247, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6326, loss: 7.2140, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.49it/s] \n", + "2023-04-07 02:05:48,501 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - reg_loss | 0.189 | 0.000\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + 
"2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UEM | 0.697 | 0.695\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - LEM | 0.489 | 0.424\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EM | 0.936 | 0.880\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.358 | 1.065\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UAS | 0.966 | 0.952\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.321 | 8.025\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - loss | 0.504 | 7.214\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - LAS | 0.937 | 0.902\n", + "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:05:48,508 - INFO - 
allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:05:53,326 - INFO - combo.training.trainer - Epoch duration: 0:01:00.392223\n", + "2023-04-07 02:05:53,327 - INFO - combo.training.trainer - Estimated training time remaining: 4:22:51\n", + "2023-04-07 02:05:53,327 - INFO - allennlp.training.trainer - Epoch 171/399\n", + "2023-04-07 02:05:53,328 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:05:53,328 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:05:53,338 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9800, UAS: 0.9725, LAS: 0.9501, UEM: 0.9113, LEM: 0.8424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0207, partial_loss/deprel_loss: 0.0859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2613, loss: 0.4325, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||: 2%|2 | 2/95 [00:03<02:36, 1.68s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9683, LAS: 0.9401, UEM: 0.8034, LEM: 0.6626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.2525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4174, loss: 0.4835, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||: 7%|7 | 7/95 [00:05<01:55, 1.31s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9652, LAS: 0.9365, UEM: 0.7790, LEM: 0.6240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1633, partial_loss/deprel_loss: 0.2132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.4996, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||: 12%|#1 | 11/95 
[00:07<01:30, 1.08s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9678, LAS: 0.9386, UEM: 0.7664, LEM: 0.5865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1950, partial_loss/deprel_loss: 0.2914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4872, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||: 17%|#6 | 16/95 [00:09<01:09, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9692, LAS: 0.9398, UEM: 0.7505, LEM: 0.5586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4056, loss: 0.4809, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||: 22%|##2 | 21/95 [00:12<00:56, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9704, LAS: 0.9406, UEM: 0.7493, LEM: 0.5435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1785, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4323, loss: 0.4747, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||: 27%|##7 | 26/95 [00:14<00:45, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9703, LAS: 0.9406, UEM: 0.7494, LEM: 0.5445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1113, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3643, loss: 0.4752, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||: 32%|###1 | 30/95 [00:16<00:40, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9696, LAS: 0.9397, UEM: 
0.7372, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2091, partial_loss/deprel_loss: 0.2668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4435, loss: 0.4816, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||: 36%|###5 | 34/95 [00:18<00:36, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9700, LAS: 0.9400, UEM: 0.7325, LEM: 0.5208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5241, loss: 0.4803, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||: 41%|####1 | 39/95 [00:21<00:30, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9699, LAS: 0.9401, UEM: 0.7327, LEM: 0.5236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3314, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5494, loss: 0.4811, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||: 45%|####5 | 43/95 [00:23<00:28, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9691, LAS: 0.9394, UEM: 0.7168, LEM: 0.5071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.4881, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||: 51%|##### | 48/95 [00:25<00:24, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9694, LAS: 0.9400, UEM: 0.7222, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0995, partial_loss/deprel_loss: 0.1760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3489, loss: 0.4851, batch_reg_loss: 0.1882, 
reg_loss: 0.1883 ||: 56%|#####5 | 53/95 [00:27<00:21, 1.95it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9689, LAS: 0.9395, UEM: 0.7107, LEM: 0.5024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2013, partial_loss/deprel_loss: 0.2850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4883, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||: 61%|######1 | 58/95 [00:30<00:18, 1.97it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9689, LAS: 0.9396, UEM: 0.7063, LEM: 0.4967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4276, loss: 0.4874, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||: 66%|######6 | 63/95 [00:32<00:15, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9685, LAS: 0.9392, UEM: 0.7010, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4787, partial_loss/deprel_loss: 0.4124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.4897, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||: 72%|#######1 | 68/95 [00:35<00:13, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9688, LAS: 0.9393, UEM: 0.7078, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4541, partial_loss/deprel_loss: 0.3486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5579, loss: 0.4890, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||: 77%|#######6 | 73/95 [00:37<00:10, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9535, UAS: 0.9681, LAS: 0.9388, UEM: 0.6992, LEM: 
0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2062, partial_loss/deprel_loss: 0.2743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.4939, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||: 82%|########2 | 78/95 [00:39<00:07, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9680, LAS: 0.9386, UEM: 0.6943, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5463, partial_loss/deprel_loss: 0.4094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6249, loss: 0.4966, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||: 87%|########7 | 83/95 [00:41<00:05, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9679, LAS: 0.9386, UEM: 0.6982, LEM: 0.4858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3599, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.4961, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||: 93%|#########2| 88/95 [00:44<00:03, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9669, LAS: 0.9376, UEM: 0.6929, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4144, loss: 0.5021, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||: 98%|#########7| 93/95 [00:46<00:00, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9612, UAS: 0.9671, LAS: 0.9378, UEM: 0.6992, LEM: 0.4909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0732, partial_loss/deprel_loss: 0.1482, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3213, loss: 0.5004, batch_reg_loss: 
0.1881, reg_loss: 0.1883 ||: 100%|##########| 95/95 [00:47<00:00, 1.99it/s]\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - reg_loss | 0.188 | N/A\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - UEM | 0.699 | N/A\n", + "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - LEM | 0.491 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - EM | 0.961 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.073 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - UAS | 0.967 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.148 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - loss | 0.500 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - LAS | 0.938 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + 
"2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:06:43,864 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:06:48,563 - INFO - combo.training.trainer - Epoch duration: 0:00:55.235260\n", + "2023-04-07 02:06:48,563 - INFO - combo.training.trainer - Estimated training time remaining: 4:21:24\n", + "2023-04-07 02:06:48,563 - INFO - allennlp.training.trainer - Epoch 172/399\n", + "2023-04-07 02:06:48,564 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:06:48,564 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:06:48,574 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9654, LAS: 0.9351, UEM: 0.6406, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5035, loss: 0.5067, batch_reg_loss: 0.1881, reg_loss: 0.1881 ||: 4%|4 | 4/95 [00:02<00:46, 1.94it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9668, LAS: 0.9381, UEM: 0.7154, LEM: 0.5356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2848, partial_loss/deprel_loss: 0.2695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4606, loss: 0.4873, 
batch_reg_loss: 0.1881, reg_loss: 0.1881 ||: 8%|8 | 8/95 [00:04<00:44, 1.94it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9678, LAS: 0.9385, UEM: 0.6907, LEM: 0.4949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1446, partial_loss/deprel_loss: 0.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4125, loss: 0.4866, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||: 14%|#3 | 13/95 [00:06<00:40, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9687, LAS: 0.9392, UEM: 0.6788, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.4863, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||: 19%|#8 | 18/95 [00:08<00:37, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9653, LAS: 0.9356, UEM: 0.6687, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0776, partial_loss/deprel_loss: 0.6299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9074, loss: 0.5121, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||: 23%|##3 | 22/95 [00:10<00:36, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9662, LAS: 0.9369, UEM: 0.6886, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.2678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4280, loss: 0.5059, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 28%|##8 | 27/95 [00:13<00:33, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9663, LAS: 0.9369, UEM: 0.6907, LEM: 0.4835, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1518, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4266, loss: 0.5073, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 33%|###2 | 31/95 [00:15<00:31, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9651, LAS: 0.9357, UEM: 0.6733, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4089, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.5143, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 38%|###7 | 36/95 [00:17<00:28, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9538, UAS: 0.9654, LAS: 0.9361, UEM: 0.6825, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1190, partial_loss/deprel_loss: 0.2261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3926, loss: 0.5107, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||: 42%|####2 | 40/95 [00:19<00:27, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9653, LAS: 0.9361, UEM: 0.6749, LEM: 0.4693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2404, partial_loss/deprel_loss: 0.2831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.5092, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 47%|####7 | 45/95 [00:21<00:23, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9657, LAS: 0.9362, UEM: 0.6765, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2225, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.5081, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 
53%|#####2 | 50/95 [00:23<00:21, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9660, LAS: 0.9366, UEM: 0.6709, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.2366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4173, loss: 0.5059, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 58%|#####7 | 55/95 [00:26<00:18, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9659, LAS: 0.9366, UEM: 0.6683, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4734, loss: 0.5053, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 63%|######3 | 60/95 [00:28<00:15, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9764, UAS: 0.9665, LAS: 0.9373, UEM: 0.6924, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0326, partial_loss/deprel_loss: 0.0888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2654, loss: 0.5009, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 68%|######8 | 65/95 [00:30<00:14, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9665, LAS: 0.9375, UEM: 0.6984, LEM: 0.4983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.2718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4355, loss: 0.4997, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||: 74%|#######3 | 70/95 [00:33<00:12, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9665, LAS: 0.9376, UEM: 0.6949, LEM: 0.4936, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7259, loss: 0.5003, batch_reg_loss: 0.1878, reg_loss: 0.1880 ||: 79%|#######8 | 75/95 [00:35<00:09, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9662, LAS: 0.9372, UEM: 0.6853, LEM: 0.4833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4882, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6266, loss: 0.5023, batch_reg_loss: 0.1878, reg_loss: 0.1880 ||: 84%|########4 | 80/95 [00:37<00:06, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9665, LAS: 0.9373, UEM: 0.6917, LEM: 0.4898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4786, loss: 0.5004, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 89%|########9 | 85/95 [00:40<00:04, 2.14it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9665, LAS: 0.9373, UEM: 0.6970, LEM: 0.4944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.5000, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 95%|#########4| 90/95 [00:42<00:02, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9666, LAS: 0.9374, UEM: 0.6953, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.5184, loss: 0.4993, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 100%|##########| 95/95 [00:45<00:00, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9666, LAS: 0.9374, UEM: 0.6953, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5184, loss: 0.4993, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 100%|##########| 95/95 [00:45<00:00, 2.11it/s]\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - reg_loss | 0.188 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UEM | 0.695 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LEM | 0.492 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EM | 0.938 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.302 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UAS | 0.967 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.338 | N/A\n", + "2023-04-07 
02:07:36,068 - INFO - combo.training.tensorboard_writer - loss | 0.499 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LAS | 0.937 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:07:36,069 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:07:36,072 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:07:39,884 - INFO - combo.training.trainer - Epoch duration: 0:00:51.320842\n", + "2023-04-07 02:07:39,885 - INFO - combo.training.trainer - Estimated training time remaining: 4:19:53\n", + "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - Epoch 173/399\n", + "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:07:39,894 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9668, LAS: 0.9351, UEM: 0.7266, LEM: 0.5045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1379, partial_loss/deprel_loss: 0.2552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.5019, batch_reg_loss: 0.1877, 
reg_loss: 0.1877 ||: 5%|5 | 5/95 [00:02<00:45, 1.98it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9691, LAS: 0.9388, UEM: 0.6967, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2543, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.4870, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||: 11%|# | 10/95 [00:04<00:41, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9680, LAS: 0.9385, UEM: 0.6448, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2867, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.4966, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||: 16%|#5 | 15/95 [00:07<00:38, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9652, LAS: 0.9361, UEM: 0.6765, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0895, partial_loss/deprel_loss: 0.1832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3521, loss: 0.5077, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||: 21%|##1 | 20/95 [00:09<00:35, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9654, LAS: 0.9368, UEM: 0.6994, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6584, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.5024, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||: 26%|##6 | 25/95 [00:11<00:33, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9669, LAS: 0.9382, UEM: 0.7003, LEM: 0.5003, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3080, partial_loss/deprel_loss: 0.2853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4775, loss: 0.4950, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||: 32%|###1 | 30/95 [00:13<00:29, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9671, LAS: 0.9384, UEM: 0.6968, LEM: 0.4940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3844, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.4927, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||: 37%|###6 | 35/95 [00:16<00:28, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9666, LAS: 0.9376, UEM: 0.6920, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9114, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7207, loss: 0.4980, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||: 42%|####2 | 40/95 [00:18<00:25, 2.13it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9680, LAS: 0.9396, UEM: 0.7289, LEM: 0.5380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.2103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3866, loss: 0.4856, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||: 47%|####7 | 45/95 [00:21<00:24, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9686, LAS: 0.9401, UEM: 0.7335, LEM: 0.5403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4065, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5535, loss: 
0.4817, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||: 53%|#####2 | 50/95 [00:23<00:21, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9686, LAS: 0.9400, UEM: 0.7342, LEM: 0.5408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.2988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.4833, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||: 58%|#####7 | 55/95 [00:26<00:19, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9679, LAS: 0.9392, UEM: 0.7241, LEM: 0.5296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0444, partial_loss/deprel_loss: 0.4688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7715, loss: 0.4892, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||: 63%|######3 | 60/95 [00:28<00:16, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9678, LAS: 0.9390, UEM: 0.7198, LEM: 0.5223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4509, partial_loss/deprel_loss: 0.3862, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5867, loss: 0.4908, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||: 68%|######8 | 65/95 [00:30<00:13, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9674, LAS: 0.9387, UEM: 0.7102, LEM: 0.5122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2441, partial_loss/deprel_loss: 0.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.4921, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||: 74%|#######3 | 70/95 [00:33<00:11, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9668, LAS: 
0.9379, UEM: 0.7007, LEM: 0.5021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7125, partial_loss/deprel_loss: 0.4865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.4986, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||: 79%|#######8 | 75/95 [00:35<00:09, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9674, LAS: 0.9383, UEM: 0.7049, LEM: 0.5035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1480, partial_loss/deprel_loss: 0.3090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.4961, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 84%|########4 | 80/95 [00:37<00:07, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9675, LAS: 0.9383, UEM: 0.7038, LEM: 0.5023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1645, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.4957, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 89%|########9 | 85/95 [00:40<00:04, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9676, LAS: 0.9384, UEM: 0.7036, LEM: 0.4999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2718, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.4949, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 95%|#########4| 90/95 [00:42<00:02, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9674, LAS: 0.9380, UEM: 0.6967, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3628, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5687, loss: 
0.4976, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 100%|##########| 95/95 [00:44<00:00, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9674, LAS: 0.9380, UEM: 0.6967, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3628, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5687, loss: 0.4976, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 100%|##########| 95/95 [00:44<00:00, 2.12it/s]\n", + "2023-04-07 02:08:27,737 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - reg_loss | 0.188 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UEM | 0.697 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - LEM | 0.492 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EM | 0.923 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.363 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UAS | 0.967 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.386 | N/A\n", + "2023-04-07 02:08:27,738 - INFO - 
combo.training.tensorboard_writer - loss | 0.498 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - LAS | 0.938 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.845 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:08:27,744 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:08:32,237 - INFO - combo.training.trainer - Epoch duration: 0:00:52.352574\n", + "2023-04-07 02:08:32,238 - INFO - combo.training.trainer - Estimated training time remaining: 4:18:23\n", + "2023-04-07 02:08:32,238 - INFO - allennlp.training.trainer - Epoch 174/399\n", + "2023-04-07 02:08:32,238 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:08:32,239 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:08:32,250 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9754, LAS: 0.9467, UEM: 0.7662, LEM: 0.5495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0672, partial_loss/deprel_loss: 0.1893, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.3522, loss: 0.4420, batch_reg_loss: 0.1874, reg_loss: 0.1874 ||: 5%|5 | 5/95 [00:02<00:42, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9713, LAS: 0.9423, UEM: 0.7106, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4549, loss: 0.4666, batch_reg_loss: 0.1874, reg_loss: 0.1874 ||: 11%|# | 10/95 [00:04<00:40, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9706, LAS: 0.9419, UEM: 0.6911, LEM: 0.4658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2233, partial_loss/deprel_loss: 0.2813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4570, loss: 0.4739, batch_reg_loss: 0.1873, reg_loss: 0.1874 ||: 16%|#5 | 15/95 [00:06<00:37, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9699, LAS: 0.9412, UEM: 0.6877, LEM: 0.4705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3466, partial_loss/deprel_loss: 0.3447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5324, loss: 0.4771, batch_reg_loss: 0.1873, reg_loss: 0.1874 ||: 21%|##1 | 20/95 [00:09<00:35, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9690, LAS: 0.9393, UEM: 0.7068, LEM: 0.4927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7900, partial_loss/deprel_loss: 0.4784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7280, loss: 0.4828, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||: 26%|##6 | 25/95 [00:11<00:33, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9658, LAS: 0.9361, UEM: 
0.6803, LEM: 0.4683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8419, partial_loss/deprel_loss: 0.5101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7638, loss: 0.5070, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||: 32%|###1 | 30/95 [00:14<00:31, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9554, UAS: 0.9666, LAS: 0.9369, UEM: 0.6862, LEM: 0.4727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1228, partial_loss/deprel_loss: 0.2493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4113, loss: 0.5049, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||: 36%|###5 | 34/95 [00:16<00:29, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9661, LAS: 0.9365, UEM: 0.6719, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4983, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5741, loss: 0.5089, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||: 40%|#### | 38/95 [00:18<00:28, 2.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9666, LAS: 0.9373, UEM: 0.6827, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1798, partial_loss/deprel_loss: 0.2568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4286, loss: 0.5011, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||: 45%|####5 | 43/95 [00:20<00:25, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9667, LAS: 0.9374, UEM: 0.6793, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4999, batch_reg_loss: 0.1872, 
reg_loss: 0.1873 ||: 51%|##### | 48/95 [00:23<00:22, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9663, LAS: 0.9371, UEM: 0.6693, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3065, partial_loss/deprel_loss: 0.3364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5176, loss: 0.5033, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||: 56%|#####5 | 53/95 [00:25<00:20, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9667, LAS: 0.9375, UEM: 0.6694, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.2654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4502, loss: 0.4998, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||: 61%|######1 | 58/95 [00:27<00:17, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9672, LAS: 0.9381, UEM: 0.6852, LEM: 0.4772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0324, partial_loss/deprel_loss: 0.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2735, loss: 0.4956, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||: 66%|######6 | 63/95 [00:30<00:15, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9675, LAS: 0.9383, UEM: 0.6916, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1398, partial_loss/deprel_loss: 0.2216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3924, loss: 0.4931, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||: 72%|#######1 | 68/95 [00:32<00:12, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9673, LAS: 0.9384, UEM: 0.6854, LEM: 0.4777, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5172, loss: 0.4935, batch_reg_loss: 0.1871, reg_loss: 0.1873 ||: 77%|#######6 | 73/95 [00:34<00:10, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9451, UAS: 0.9668, LAS: 0.9379, UEM: 0.6789, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1879, partial_loss/deprel_loss: 0.2809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.4964, batch_reg_loss: 0.1871, reg_loss: 0.1873 ||: 82%|########2 | 78/95 [00:37<00:08, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9669, LAS: 0.9381, UEM: 0.6832, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3689, partial_loss/deprel_loss: 0.3222, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5186, loss: 0.4952, batch_reg_loss: 0.1871, reg_loss: 0.1872 ||: 87%|########7 | 83/95 [00:39<00:05, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9676, LAS: 0.9388, UEM: 0.6984, LEM: 0.4952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0900, partial_loss/deprel_loss: 0.1902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3573, loss: 0.4903, batch_reg_loss: 0.1871, reg_loss: 0.1872 ||: 93%|#########2| 88/95 [00:42<00:03, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9680, LAS: 0.9391, UEM: 0.7009, LEM: 0.4951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.4885, batch_reg_loss: 0.1871, 
reg_loss: 0.1872 ||: 98%|#########7| 93/95 [00:44<00:00, 2.07it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9677, LAS: 0.9389, UEM: 0.6975, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.2698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4672, loss: 0.4900, batch_reg_loss: 0.1870, reg_loss: 0.1872 ||: 100%|##########| 95/95 [00:45<00:00, 2.09it/s]\n", + "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - reg_loss | 0.187 | N/A\n", + "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UEM | 0.697 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LEM | 0.492 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - EM | 0.945 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.321 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UAS | 0.968 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.270 | 
N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - loss | 0.490 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LAS | 0.939 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:09:20,945 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:09:25,709 - INFO - combo.training.trainer - Epoch duration: 0:00:53.471397\n", + "2023-04-07 02:09:25,710 - INFO - combo.training.trainer - Estimated training time remaining: 4:16:55\n", + "2023-04-07 02:09:25,710 - INFO - allennlp.training.trainer - Epoch 175/399\n", + "2023-04-07 02:09:25,710 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:09:25,711 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:09:25,720 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9662, LAS: 0.9369, UEM: 0.7409, LEM: 0.5371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.2315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3982, loss: 0.4858, 
batch_reg_loss: 0.1870, reg_loss: 0.1870 ||: 5%|5 | 5/95 [00:02<00:43, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9621, LAS: 0.9336, UEM: 0.6399, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.2733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4495, loss: 0.5212, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||: 11%|# | 10/95 [00:04<00:40, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9637, LAS: 0.9356, UEM: 0.6253, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5335, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.5136, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||: 15%|#4 | 14/95 [00:06<00:39, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9643, LAS: 0.9366, UEM: 0.6265, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2836, partial_loss/deprel_loss: 0.3064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.5072, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||: 20%|## | 19/95 [00:09<00:36, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9650, LAS: 0.9375, UEM: 0.6447, LEM: 0.4437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.4992, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||: 25%|##5 | 24/95 [00:11<00:33, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9668, LAS: 0.9390, UEM: 0.6874, LEM: 0.4897, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2737, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.4892, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 31%|### | 29/95 [00:13<00:31, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9667, LAS: 0.9385, UEM: 0.6772, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3763, partial_loss/deprel_loss: 0.3628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.4919, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 36%|###5 | 34/95 [00:16<00:28, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9664, LAS: 0.9384, UEM: 0.6660, LEM: 0.4586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3088, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.4938, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 41%|####1 | 39/95 [00:18<00:25, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9668, LAS: 0.9387, UEM: 0.6746, LEM: 0.4676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.2160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3886, loss: 0.4902, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 46%|####6 | 44/95 [00:20<00:23, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9672, LAS: 0.9391, UEM: 0.6930, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1267, partial_loss/deprel_loss: 0.2429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4065, loss: 0.4877, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 
52%|#####1 | 49/95 [00:23<00:21, 2.10it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9553, UAS: 0.9665, LAS: 0.9385, UEM: 0.6856, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1364, partial_loss/deprel_loss: 0.2059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3788, loss: 0.4915, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||: 57%|#####6 | 54/95 [00:25<00:19, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9659, LAS: 0.9379, UEM: 0.6728, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3806, partial_loss/deprel_loss: 0.3239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.4978, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||: 62%|######2 | 59/95 [00:27<00:16, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9665, LAS: 0.9384, UEM: 0.6843, LEM: 0.4827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.1964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3696, loss: 0.4941, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||: 67%|######7 | 64/95 [00:30<00:14, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9666, LAS: 0.9384, UEM: 0.6792, LEM: 0.4764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3055, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5591, loss: 0.4943, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||: 73%|#######2 | 69/95 [00:32<00:11, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, 
UAS: 0.9672, LAS: 0.9389, UEM: 0.6884, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1952, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4904, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||: 78%|#######7 | 74/95 [00:34<00:09, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9667, LAS: 0.9385, UEM: 0.6771, LEM: 0.4741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4252, partial_loss/deprel_loss: 0.3328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5380, loss: 0.4942, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||: 83%|########3 | 79/95 [00:37<00:07, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9668, LAS: 0.9387, UEM: 0.6865, LEM: 0.4900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1773, partial_loss/deprel_loss: 0.2759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.4927, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||: 88%|########8 | 84/95 [00:39<00:05, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9676, LAS: 0.9392, UEM: 0.7002, LEM: 0.4987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1410, partial_loss/deprel_loss: 0.2602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4231, loss: 0.4887, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||: 94%|#########3| 89/95 [00:42<00:02, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9678, LAS: 0.9395, UEM: 0.7012, LEM: 0.4997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0891, partial_loss/deprel_loss: 0.2031, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.3670, loss: 0.4872, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||: 99%|#########8| 94/95 [00:44<00:00, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9676, LAS: 0.9393, UEM: 0.6989, LEM: 0.4977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5695, partial_loss/deprel_loss: 0.3864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6098, loss: 0.4885, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||: 100%|##########| 95/95 [00:44<00:00, 2.11it/s]\n", + "2023-04-07 02:10:13,809 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9487, LAS: 0.8983, UEM: 0.6867, LEM: 0.4739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0548, partial_loss/deprel_loss: 8.0360, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6398, loss: 7.0117, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:02<00:04, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9503, LAS: 0.9017, UEM: 0.7040, LEM: 0.4726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5264, partial_loss/deprel_loss: 16.6715, partial_loss/cycle_loss: 0.0000, batch_loss: 13.6425, loss: 7.3681, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:04<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9518, LAS: 0.9014, UEM: 0.6831, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5225, partial_loss/deprel_loss: 7.1535, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8273, loss: 7.1744, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 
1.51it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9518, LAS: 0.9014, UEM: 0.6831, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5225, partial_loss/deprel_loss: 7.1535, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8273, loss: 7.1744, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.50it/s]\n", + "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer - reg_loss | 0.187 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UEM | 0.699 | 0.683\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LEM | 0.498 | 0.415\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EM | 0.920 | 0.905\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.570 | 0.523\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UAS | 0.968 | 0.952\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.386 | 7.153\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - loss | 0.489 | 7.174\n", + 
"2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LAS | 0.939 | 0.901\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:10:21,135 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:10:21,135 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:10:21,139 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:10:25,839 - INFO - combo.training.trainer - Epoch duration: 0:01:00.129085\n", + "2023-04-07 02:10:25,840 - INFO - combo.training.trainer - Estimated training time remaining: 4:15:35\n", + "2023-04-07 02:10:25,840 - INFO - allennlp.training.trainer - Epoch 176/399\n", + "2023-04-07 02:10:25,840 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:10:25,841 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:10:25,850 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9736, LAS: 0.9421, UEM: 0.7172, LEM: 0.4547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2733, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.4643, batch_reg_loss: 0.1867, 
reg_loss: 0.1867 ||: 5%|5 | 5/95 [00:02<00:38, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9735, LAS: 0.9443, UEM: 0.7156, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1517, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.4558, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||: 11%|# | 10/95 [00:04<00:36, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9701, LAS: 0.9417, UEM: 0.7079, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.2318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3994, loss: 0.4714, batch_reg_loss: 0.1866, reg_loss: 0.1867 ||: 16%|#5 | 15/95 [00:06<00:36, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9689, LAS: 0.9400, UEM: 0.6964, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5728, partial_loss/deprel_loss: 0.3881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6117, loss: 0.4803, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||: 21%|##1 | 20/95 [00:09<00:34, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9700, LAS: 0.9414, UEM: 0.7148, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0880, partial_loss/deprel_loss: 0.1952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3603, loss: 0.4688, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||: 26%|##6 | 25/95 [00:11<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9701, LAS: 0.9414, UEM: 0.7079, LEM: 0.4883, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0996, partial_loss/deprel_loss: 0.2304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3908, loss: 0.4698, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||: 32%|###1 | 30/95 [00:13<00:28, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9710, LAS: 0.9429, UEM: 0.7498, LEM: 0.5551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.1781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3574, loss: 0.4600, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||: 36%|###5 | 34/95 [00:15<00:29, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9702, LAS: 0.9423, UEM: 0.7355, LEM: 0.5374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5495, partial_loss/deprel_loss: 0.3517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.4654, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||: 41%|####1 | 39/95 [00:18<00:26, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9703, LAS: 0.9422, UEM: 0.7315, LEM: 0.5286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4231, partial_loss/deprel_loss: 0.3928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.4662, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||: 45%|####5 | 43/95 [00:20<00:25, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9705, LAS: 0.9425, UEM: 0.7315, LEM: 0.5290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0979, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3712, loss: 0.4664, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||: 51%|##### | 48/95 
[00:22<00:22, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9698, LAS: 0.9417, UEM: 0.7230, LEM: 0.5194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5247, partial_loss/deprel_loss: 0.3651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.4715, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||: 56%|#####5 | 53/95 [00:24<00:19, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9483, UAS: 0.9694, LAS: 0.9411, UEM: 0.7197, LEM: 0.5139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1925, partial_loss/deprel_loss: 0.3408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.4757, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||: 61%|######1 | 58/95 [00:27<00:17, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9694, LAS: 0.9412, UEM: 0.7165, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4799, loss: 0.4759, batch_reg_loss: 0.1864, reg_loss: 0.1866 ||: 66%|######6 | 63/95 [00:29<00:15, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9693, LAS: 0.9412, UEM: 0.7166, LEM: 0.5146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0665, partial_loss/deprel_loss: 0.1377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3099, loss: 0.4770, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||: 72%|#######1 | 68/95 [00:31<00:12, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9691, LAS: 0.9411, UEM: 0.7162, LEM: 0.5155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7586, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7201, loss: 0.4784, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||: 77%|#######6 | 73/95 [00:34<00:10, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9689, LAS: 0.9408, UEM: 0.7165, LEM: 0.5143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9787, partial_loss/deprel_loss: 0.5288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8052, loss: 0.4813, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||: 82%|########2 | 78/95 [00:36<00:08, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9686, LAS: 0.9405, UEM: 0.7123, LEM: 0.5082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.4826, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||: 87%|########7 | 83/95 [00:38<00:05, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9681, LAS: 0.9400, UEM: 0.7034, LEM: 0.4989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2496, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4858, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||: 93%|#########2| 88/95 [00:41<00:03, 2.14it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9684, LAS: 0.9402, UEM: 0.7072, LEM: 0.5033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 
0.4848, batch_reg_loss: 0.1863, reg_loss: 0.1865 ||: 98%|#########7| 93/95 [00:43<00:00, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9683, LAS: 0.9401, UEM: 0.7039, LEM: 0.4996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3500, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.4860, batch_reg_loss: 0.1863, reg_loss: 0.1865 ||: 100%|##########| 95/95 [00:44<00:00, 2.13it/s]\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - reg_loss | 0.187 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UEM | 0.704 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - LEM | 0.500 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EM | 0.941 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.350 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UAS | 0.968 | N/A\n", + "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.314 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - 
combo.training.tensorboard_writer - loss | 0.486 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - LAS | 0.940 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:11:13,585 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:11:18,407 - INFO - combo.training.trainer - Epoch duration: 0:00:52.567475\n", + "2023-04-07 02:11:18,408 - INFO - combo.training.trainer - Estimated training time remaining: 4:14:07\n", + "2023-04-07 02:11:18,408 - INFO - allennlp.training.trainer - Epoch 177/399\n", + "2023-04-07 02:11:18,408 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:11:18,409 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:11:18,417 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9532, UAS: 0.9691, LAS: 0.9429, UEM: 0.7046, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.4576, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||: 5%|5 | 
5/95 [00:02<00:38, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9739, LAS: 0.9472, UEM: 0.7883, LEM: 0.5924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3798, loss: 0.4267, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||: 11%|# | 10/95 [00:04<00:38, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9735, LAS: 0.9456, UEM: 0.7580, LEM: 0.5463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1520, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3999, loss: 0.4449, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||: 16%|#5 | 15/95 [00:07<00:36, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9725, LAS: 0.9443, UEM: 0.7376, LEM: 0.5214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.2340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4530, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||: 21%|##1 | 20/95 [00:09<00:33, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9734, LAS: 0.9455, UEM: 0.7734, LEM: 0.5827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0992, partial_loss/deprel_loss: 0.1703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3423, loss: 0.4430, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||: 25%|##5 | 24/95 [00:11<00:33, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9715, LAS: 0.9437, UEM: 0.7634, LEM: 0.5770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.3644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.4542, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||: 29%|##9 | 28/95 [00:13<00:32, 2.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9719, LAS: 0.9438, UEM: 0.7596, LEM: 0.5644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3942, loss: 0.4535, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||: 36%|###5 | 34/95 [00:15<00:28, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9712, LAS: 0.9433, UEM: 0.7448, LEM: 0.5488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3113, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.4607, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||: 41%|####1 | 39/95 [00:17<00:25, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9700, LAS: 0.9424, UEM: 0.7470, LEM: 0.5602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1133, partial_loss/deprel_loss: 0.2004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3691, loss: 0.4649, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||: 46%|####6 | 44/95 [00:20<00:23, 2.18it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9695, LAS: 0.9418, UEM: 0.7385, LEM: 0.5475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6892, partial_loss/deprel_loss: 0.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6919, loss: 0.4696, batch_reg_loss: 0.1861, 
reg_loss: 0.1862 ||: 52%|#####1 | 49/95 [00:22<00:20, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9682, LAS: 0.9405, UEM: 0.7245, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9134, partial_loss/deprel_loss: 0.4578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7351, loss: 0.4782, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||: 57%|#####6 | 54/95 [00:24<00:18, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9683, LAS: 0.9404, UEM: 0.7213, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.3174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4933, loss: 0.4771, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||: 63%|######3 | 60/95 [00:26<00:15, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9686, LAS: 0.9406, UEM: 0.7199, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4390, loss: 0.4748, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||: 68%|######8 | 65/95 [00:29<00:13, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9686, LAS: 0.9405, UEM: 0.7183, LEM: 0.5185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1395, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4030, loss: 0.4750, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9676, LAS: 0.9396, UEM: 0.7092, LEM: 
0.5094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5968, loss: 0.4827, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||: 79%|#######8 | 75/95 [00:33<00:09, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9671, LAS: 0.9389, UEM: 0.6995, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4870, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 84%|########4 | 80/95 [00:36<00:06, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9674, LAS: 0.9394, UEM: 0.6988, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2487, partial_loss/deprel_loss: 0.2758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4565, loss: 0.4839, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 89%|########9 | 85/95 [00:38<00:04, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9675, LAS: 0.9393, UEM: 0.6969, LEM: 0.4925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0929, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3971, loss: 0.4851, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 95%|#########4| 90/95 [00:40<00:02, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9675, LAS: 0.9391, UEM: 0.6996, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.4848, batch_reg_loss: 0.1860, 
reg_loss: 0.1862 ||: 100%|##########| 95/95 [00:42<00:00, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9675, LAS: 0.9391, UEM: 0.6996, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.4848, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 100%|##########| 95/95 [00:42<00:00, 2.22it/s]\n", + "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - reg_loss | 0.186 | N/A\n", + "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UEM | 0.700 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LEM | 0.496 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - EM | 0.929 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.397 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UAS | 0.968 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.308 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - 
combo.training.tensorboard_writer - loss | 0.485 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LAS | 0.939 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:04,422 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:12:09,262 - INFO - combo.training.trainer - Epoch duration: 0:00:50.853596\n", + "2023-04-07 02:12:09,262 - INFO - combo.training.trainer - Estimated training time remaining: 4:12:37\n", + "2023-04-07 02:12:09,262 - INFO - allennlp.training.trainer - Epoch 178/399\n", + "2023-04-07 02:12:09,263 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:12:09,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:12:09,271 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9771, LAS: 0.9459, UEM: 0.8007, LEM: 0.5751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0742, partial_loss/deprel_loss: 0.1687, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.3357, loss: 0.4355, batch_reg_loss: 0.1860, reg_loss: 0.1860 ||: 5%|5 | 5/95 [00:02<00:41, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9691, LAS: 0.9408, UEM: 0.7053, LEM: 0.4880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7240, partial_loss/deprel_loss: 0.3619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.4856, batch_reg_loss: 0.1860, reg_loss: 0.1860 ||: 11%|# | 10/95 [00:04<00:39, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9661, LAS: 0.9379, UEM: 0.6407, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2132, partial_loss/deprel_loss: 0.2303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4128, loss: 0.4981, batch_reg_loss: 0.1859, reg_loss: 0.1860 ||: 16%|#5 | 15/95 [00:06<00:36, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9692, LAS: 0.9409, UEM: 0.7156, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1023, partial_loss/deprel_loss: 0.2382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3970, loss: 0.4764, batch_reg_loss: 0.1859, reg_loss: 0.1860 ||: 21%|##1 | 20/95 [00:09<00:34, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9672, LAS: 0.9391, UEM: 0.6871, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.3675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5795, loss: 0.4870, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||: 26%|##6 | 25/95 [00:11<00:31, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9564, UAS: 0.9672, LAS: 0.9392, UEM: 
0.7025, LEM: 0.4973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1483, partial_loss/deprel_loss: 0.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3956, loss: 0.4867, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||: 31%|### | 29/95 [00:13<00:31, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9682, LAS: 0.9402, UEM: 0.7164, LEM: 0.5110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0899, partial_loss/deprel_loss: 0.2149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3757, loss: 0.4796, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||: 35%|###4 | 33/95 [00:15<00:30, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9676, LAS: 0.9394, UEM: 0.7095, LEM: 0.5035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2311, partial_loss/deprel_loss: 0.2782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.4861, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||: 40%|#### | 38/95 [00:17<00:27, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9664, LAS: 0.9381, UEM: 0.6917, LEM: 0.4876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3869, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5643, loss: 0.4963, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||: 44%|####4 | 42/95 [00:19<00:25, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9671, LAS: 0.9385, UEM: 0.6923, LEM: 0.4830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.2968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4664, loss: 0.4938, batch_reg_loss: 0.1858, 
reg_loss: 0.1859 ||: 49%|####9 | 47/95 [00:21<00:22, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9676, LAS: 0.9390, UEM: 0.7013, LEM: 0.4943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0641, partial_loss/deprel_loss: 0.1436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3135, loss: 0.4904, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||: 55%|#####4 | 52/95 [00:23<00:19, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9677, LAS: 0.9387, UEM: 0.6950, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.4918, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||: 60%|###### | 57/95 [00:26<00:17, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9678, LAS: 0.9390, UEM: 0.6928, LEM: 0.4797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1609, partial_loss/deprel_loss: 0.2728, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4362, loss: 0.4911, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||: 65%|######5 | 62/95 [00:28<00:14, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9684, LAS: 0.9397, UEM: 0.6997, LEM: 0.4862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.2146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3997, loss: 0.4859, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||: 71%|####### | 67/95 [00:30<00:12, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9680, LAS: 0.9391, UEM: 0.6943, LEM: 0.4817, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6043, loss: 0.4896, batch_reg_loss: 0.1857, reg_loss: 0.1859 ||: 76%|#######5 | 72/95 [00:32<00:10, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9681, LAS: 0.9392, UEM: 0.6975, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5883, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5905, loss: 0.4893, batch_reg_loss: 0.1857, reg_loss: 0.1859 ||: 81%|########1 | 77/95 [00:35<00:08, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9686, LAS: 0.9400, UEM: 0.7131, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.4845, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||: 86%|########6 | 82/95 [00:37<00:05, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9687, LAS: 0.9400, UEM: 0.7106, LEM: 0.5041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4571, loss: 0.4844, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||: 92%|#########1| 87/95 [00:39<00:03, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9688, LAS: 0.9402, UEM: 0.7071, LEM: 0.4997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.2632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.4833, batch_reg_loss: 0.1857, 
reg_loss: 0.1858 ||: 97%|#########6| 92/95 [00:41<00:01, 2.26it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9685, LAS: 0.9399, UEM: 0.7062, LEM: 0.4987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7743, loss: 0.4859, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||: 100%|##########| 95/95 [00:43<00:00, 2.19it/s]\n", + "2023-04-07 02:12:55,913 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - reg_loss | 0.186 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UEM | 0.706 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - LEM | 0.499 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EM | 0.900 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.867 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.519 | 
N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - loss | 0.486 | N/A\n", + "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - LAS | 0.940 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:12:55,921 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:13:00,792 - INFO - combo.training.trainer - Epoch duration: 0:00:51.529326\n", + "2023-04-07 02:13:00,792 - INFO - combo.training.trainer - Estimated training time remaining: 4:11:08\n", + "2023-04-07 02:13:00,792 - INFO - allennlp.training.trainer - Epoch 179/399\n", + "2023-04-07 02:13:00,793 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:13:00,793 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:13:00,803 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9487, UAS: 0.9741, LAS: 0.9447, UEM: 0.7545, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.2657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.4412, 
batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 5%|5 | 5/95 [00:02<00:38, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9696, LAS: 0.9413, UEM: 0.6951, LEM: 0.4698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5352, loss: 0.4716, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 11%|# | 10/95 [00:04<00:36, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9708, LAS: 0.9427, UEM: 0.7186, LEM: 0.4994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.2143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3804, loss: 0.4632, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 15%|#4 | 14/95 [00:06<00:36, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9694, LAS: 0.9418, UEM: 0.6895, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2626, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.4716, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 20%|## | 19/95 [00:08<00:33, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9676, LAS: 0.9401, UEM: 0.6739, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.3503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.4829, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||: 25%|##5 | 24/95 [00:10<00:30, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9674, LAS: 0.9396, UEM: 0.6575, LEM: 0.4444, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5876, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.4877, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||: 32%|###1 | 30/95 [00:12<00:27, 2.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9671, LAS: 0.9394, UEM: 0.6786, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1968, partial_loss/deprel_loss: 0.2692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4402, loss: 0.4889, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||: 37%|###6 | 35/95 [00:15<00:26, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9684, LAS: 0.9407, UEM: 0.6999, LEM: 0.4939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.2432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4114, loss: 0.4793, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||: 42%|####2 | 40/95 [00:17<00:24, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9685, LAS: 0.9408, UEM: 0.6923, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2838, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4662, loss: 0.4792, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||: 47%|####7 | 45/95 [00:19<00:21, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9688, LAS: 0.9413, UEM: 0.7222, LEM: 0.5253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.2620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.4761, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||: 
53%|#####2 | 50/95 [00:22<00:20, 2.18it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9684, LAS: 0.9411, UEM: 0.7157, LEM: 0.5196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1743, partial_loss/deprel_loss: 0.2036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3832, loss: 0.4767, batch_reg_loss: 0.1855, reg_loss: 0.1855 ||: 58%|#####7 | 55/95 [00:24<00:18, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9665, UAS: 0.9681, LAS: 0.9410, UEM: 0.7111, LEM: 0.5155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0689, partial_loss/deprel_loss: 0.1774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3412, loss: 0.4791, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||: 63%|######3 | 60/95 [00:26<00:15, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9680, LAS: 0.9409, UEM: 0.7069, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2347, partial_loss/deprel_loss: 0.2438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4274, loss: 0.4796, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||: 68%|######8 | 65/95 [00:28<00:13, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9678, LAS: 0.9407, UEM: 0.7068, LEM: 0.5081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1226, partial_loss/deprel_loss: 0.2546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.4802, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, 
UAS: 0.9683, LAS: 0.9412, UEM: 0.7103, LEM: 0.5114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.2432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.4771, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||: 79%|#######8 | 75/95 [00:33<00:08, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9686, LAS: 0.9413, UEM: 0.7199, LEM: 0.5234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1272, partial_loss/deprel_loss: 0.2134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3815, loss: 0.4750, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||: 84%|########4 | 80/95 [00:35<00:06, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9682, LAS: 0.9409, UEM: 0.7135, LEM: 0.5157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.4787, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 89%|########9 | 85/95 [00:38<00:04, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9685, LAS: 0.9411, UEM: 0.7142, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1888, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4239, loss: 0.4767, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 95%|#########4| 90/95 [00:40<00:02, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9684, LAS: 0.9411, UEM: 0.7093, LEM: 0.5086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.2169, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.3981, loss: 0.4780, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 100%|##########| 95/95 [00:42<00:00, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9684, LAS: 0.9411, UEM: 0.7093, LEM: 0.5086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.2169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3981, loss: 0.4780, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 100%|##########| 95/95 [00:42<00:00, 2.24it/s]\n", + "2023-04-07 02:13:46,147 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - reg_loss | 0.185 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UEM | 0.709 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LEM | 0.509 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EM | 0.959 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.196 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UAS | 0.968 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.217 | N/A\n", + "2023-04-07 
02:13:46,148 - INFO - combo.training.tensorboard_writer - loss | 0.478 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LAS | 0.941 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:13:46,153 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:13:50,367 - INFO - combo.training.trainer - Epoch duration: 0:00:49.574997\n", + "2023-04-07 02:13:50,368 - INFO - combo.training.trainer - Estimated training time remaining: 4:09:37\n", + "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - Epoch 180/399\n", + "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:13:50,376 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9666, LAS: 0.9383, UEM: 0.7143, LEM: 0.5138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6386, loss: 0.4976, batch_reg_loss: 0.1853, 
reg_loss: 0.1853 ||: 5%|5 | 5/95 [00:02<00:39, 2.31it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9725, LAS: 0.9441, UEM: 0.7695, LEM: 0.5583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4063, loss: 0.4607, batch_reg_loss: 0.1853, reg_loss: 0.1853 ||: 11%|# | 10/95 [00:04<00:37, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9703, LAS: 0.9421, UEM: 0.7411, LEM: 0.5255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.2397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4011, loss: 0.4728, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||: 16%|#5 | 15/95 [00:06<00:35, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9678, LAS: 0.9398, UEM: 0.7004, LEM: 0.4850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5309, partial_loss/deprel_loss: 0.3997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6112, loss: 0.4891, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||: 21%|##1 | 20/95 [00:08<00:33, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9581, UAS: 0.9695, LAS: 0.9411, UEM: 0.7254, LEM: 0.5143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0978, partial_loss/deprel_loss: 0.1723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3426, loss: 0.4737, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||: 26%|##6 | 25/95 [00:11<00:31, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 
0.9715, LAS: 0.9437, UEM: 0.7774, LEM: 0.5921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0434, partial_loss/deprel_loss: 0.1056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2784, loss: 0.4567, batch_reg_loss: 0.1852, reg_loss: 0.1852 ||: 32%|###1 | 30/95 [00:14<00:31, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9523, UAS: 0.9717, LAS: 0.9443, UEM: 0.7673, LEM: 0.5787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.4575, batch_reg_loss: 0.1852, reg_loss: 0.1852 ||: 37%|###6 | 35/95 [00:16<00:28, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9710, LAS: 0.9432, UEM: 0.7501, LEM: 0.5583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4043, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.4664, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 42%|####2 | 40/95 [00:18<00:25, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9704, LAS: 0.9424, UEM: 0.7416, LEM: 0.5446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.2983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4587, loss: 0.4725, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 47%|####7 | 45/95 [00:20<00:22, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9699, LAS: 0.9418, UEM: 0.7404, LEM: 0.5427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1420, partial_loss/deprel_loss: 0.2244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3930, loss: 0.4751, 
batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 53%|#####2 | 50/95 [00:22<00:20, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9608, UAS: 0.9702, LAS: 0.9422, UEM: 0.7406, LEM: 0.5428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0560, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3536, loss: 0.4727, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 58%|#####7 | 55/95 [00:25<00:18, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9693, LAS: 0.9415, UEM: 0.7310, LEM: 0.5324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8916, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.4766, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 63%|######3 | 60/95 [00:27<00:16, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9695, LAS: 0.9418, UEM: 0.7304, LEM: 0.5310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.1793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.4742, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||: 68%|######8 | 65/95 [00:29<00:13, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9691, LAS: 0.9413, UEM: 0.7234, LEM: 0.5233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8747, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.4777, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||: 74%|#######3 | 70/95 [00:32<00:11, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9691, LAS: 0.9412, 
UEM: 0.7214, LEM: 0.5210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3175, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.4768, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||: 79%|#######8 | 75/95 [00:34<00:09, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9689, LAS: 0.9411, UEM: 0.7181, LEM: 0.5174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4954, loss: 0.4772, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||: 84%|########4 | 80/95 [00:36<00:06, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9688, LAS: 0.9411, UEM: 0.7141, LEM: 0.5136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2639, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4673, loss: 0.4762, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 89%|########9 | 85/95 [00:38<00:04, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9688, LAS: 0.9411, UEM: 0.7095, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3271, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.4765, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 95%|#########4| 90/95 [00:41<00:02, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9687, LAS: 0.9410, UEM: 0.7068, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1697, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.4761, 
batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 100%|##########| 95/95 [00:43<00:00, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9687, LAS: 0.9410, UEM: 0.7068, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1697, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.4761, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 100%|##########| 95/95 [00:43<00:00, 2.19it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:14:37,037 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9535, LAS: 0.9074, UEM: 0.7970, LEM: 0.5912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5753, partial_loss/deprel_loss: 16.2328, partial_loss/cycle_loss: 0.0000, batch_loss: 13.3013, loss: 7.2497, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9544, LAS: 0.9038, UEM: 0.7405, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0724, partial_loss/deprel_loss: 12.5631, partial_loss/cycle_loss: 0.0000, batch_loss: 10.2649, loss: 7.0178, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:04<00:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9519, LAS: 0.9015, UEM: 0.6893, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6453, partial_loss/deprel_loss: 6.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2296, loss: 7.0737, batch_reg_loss: 0.0000, reg_loss: 
0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.54it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9519, LAS: 0.9015, UEM: 0.6893, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6453, partial_loss/deprel_loss: 6.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2296, loss: 7.0737, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.57it/s]\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - reg_loss | 0.185 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UEM | 0.707 | 0.689\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - LEM | 0.504 | 0.416\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EM | 0.945 | 0.899\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.170 | 0.645\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | 0.952\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.267 | 6.376\n", + "2023-04-07 02:14:44,051 - INFO - 
combo.training.tensorboard_writer - loss | 0.476 | 7.074\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - LAS | 0.941 | 0.902\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:14:44,056 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:14:48,239 - INFO - combo.training.trainer - Epoch duration: 0:00:57.871390\n", + "2023-04-07 02:14:48,240 - INFO - combo.training.trainer - Estimated training time remaining: 4:08:16\n", + "2023-04-07 02:14:48,240 - INFO - allennlp.training.trainer - Epoch 181/399\n", + "2023-04-07 02:14:48,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:14:48,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:14:48,251 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9632, UAS: 0.9710, LAS: 0.9417, UEM: 0.7680, LEM: 0.5770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0552, partial_loss/deprel_loss: 0.1685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3308, loss: 0.4788, batch_reg_loss: 0.1849, reg_loss: 
0.1849 ||: 5%|5 | 5/95 [00:02<00:41, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9717, LAS: 0.9426, UEM: 0.7406, LEM: 0.5353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1134, partial_loss/deprel_loss: 0.1824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3535, loss: 0.4690, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||: 11%|# | 10/95 [00:04<00:39, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9691, LAS: 0.9408, UEM: 0.7014, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.2581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.4805, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||: 16%|#5 | 15/95 [00:06<00:36, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9685, LAS: 0.9408, UEM: 0.6720, LEM: 0.4638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.2683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4452, loss: 0.4799, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||: 21%|##1 | 20/95 [00:08<00:33, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9681, LAS: 0.9399, UEM: 0.6728, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.2204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.4819, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||: 26%|##6 | 25/95 [00:11<00:31, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9664, LAS: 0.9386, UEM: 0.6539, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2628, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4264, loss: 0.4863, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||: 32%|###1 | 30/95 [00:13<00:29, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9535, UAS: 0.9670, LAS: 0.9395, UEM: 0.6755, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2242, partial_loss/deprel_loss: 0.2373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.4807, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||: 37%|###6 | 35/95 [00:15<00:26, 2.26it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9672, LAS: 0.9397, UEM: 0.6724, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.2509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.4792, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||: 42%|####2 | 40/95 [00:17<00:24, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9681, LAS: 0.9407, UEM: 0.6855, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1212, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3980, loss: 0.4717, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||: 47%|####7 | 45/95 [00:19<00:21, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9687, LAS: 0.9412, UEM: 0.6877, LEM: 0.4805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1818, partial_loss/deprel_loss: 0.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.4700, 
batch_reg_loss: 0.1848, reg_loss: 0.1849 ||: 53%|#####2 | 50/95 [00:22<00:19, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9687, LAS: 0.9412, UEM: 0.6919, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1079, partial_loss/deprel_loss: 0.2376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3965, loss: 0.4705, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||: 58%|#####7 | 55/95 [00:24<00:17, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9680, LAS: 0.9404, UEM: 0.7010, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8331, partial_loss/deprel_loss: 0.4301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6954, loss: 0.4739, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 63%|######3 | 60/95 [00:27<00:16, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9684, LAS: 0.9407, UEM: 0.7038, LEM: 0.4976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.4448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.4739, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 68%|######8 | 65/95 [00:29<00:13, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9683, LAS: 0.9406, UEM: 0.7031, LEM: 0.4978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4556, partial_loss/deprel_loss: 0.3402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5480, loss: 0.4741, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9689, LAS: 0.9411, 
UEM: 0.7104, LEM: 0.5046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1098, partial_loss/deprel_loss: 0.2107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3752, loss: 0.4713, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 79%|#######8 | 75/95 [00:33<00:09, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9691, LAS: 0.9414, UEM: 0.7085, LEM: 0.5024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2873, partial_loss/deprel_loss: 0.2373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.4695, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 84%|########4 | 80/95 [00:35<00:06, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9689, LAS: 0.9411, UEM: 0.7038, LEM: 0.4966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1614, partial_loss/deprel_loss: 0.2006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3774, loss: 0.4733, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||: 89%|########9 | 85/95 [00:38<00:04, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9686, LAS: 0.9409, UEM: 0.7077, LEM: 0.5081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4128, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.4748, batch_reg_loss: 0.1846, reg_loss: 0.1848 ||: 95%|#########4| 90/95 [00:40<00:02, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9686, LAS: 0.9408, UEM: 0.7062, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4757, 
batch_reg_loss: 0.1846, reg_loss: 0.1848 ||: 100%|##########| 95/95 [00:42<00:00, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9686, LAS: 0.9408, UEM: 0.7062, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4757, batch_reg_loss: 0.1846, reg_loss: 0.1848 ||: 100%|##########| 95/95 [00:42<00:00, 2.22it/s]\n", + "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - reg_loss | 0.185 | N/A\n", + "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - UEM | 0.706 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - LEM | 0.504 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - EM | 0.935 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.286 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.317 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - 
combo.training.tensorboard_writer - loss | 0.476 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - LAS | 0.941 | N/A\n", + "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:15:34,195 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:15:38,586 - INFO - combo.training.trainer - Epoch duration: 0:00:50.345983\n", + "2023-04-07 02:15:38,586 - INFO - combo.training.trainer - Estimated training time remaining: 4:06:47\n", + "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - Epoch 182/399\n", + "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:15:38,594 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9589, LAS: 0.9323, UEM: 0.4513, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8072, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.7432, loss: 0.5557, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||: 5%|5 | 5/95 [00:02<00:37, 2.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9632, LAS: 0.9373, UEM: 0.6926, LEM: 0.5358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0722, partial_loss/deprel_loss: 0.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3038, loss: 0.5093, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||: 11%|# | 10/95 [00:04<00:36, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9643, LAS: 0.9378, UEM: 0.6684, LEM: 0.5039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3727, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.5034, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||: 16%|#5 | 15/95 [00:06<00:34, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9642, LAS: 0.9372, UEM: 0.6723, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2291, partial_loss/deprel_loss: 0.2518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4318, loss: 0.5044, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||: 21%|##1 | 20/95 [00:08<00:32, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9656, LAS: 0.9386, UEM: 0.6941, LEM: 0.5172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0670, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3622, loss: 0.4949, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||: 26%|##6 | 25/95 [00:10<00:30, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9667, LAS: 0.9399, UEM: 
0.6898, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2092, partial_loss/deprel_loss: 0.2409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.4878, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||: 32%|###1 | 30/95 [00:12<00:27, 2.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9673, LAS: 0.9401, UEM: 0.6961, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4122, partial_loss/deprel_loss: 0.3134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.4844, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||: 37%|###6 | 35/95 [00:15<00:25, 2.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9663, LAS: 0.9393, UEM: 0.6766, LEM: 0.4891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3957, partial_loss/deprel_loss: 0.3226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.4897, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||: 42%|####2 | 40/95 [00:17<00:23, 2.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9662, LAS: 0.9391, UEM: 0.6756, LEM: 0.4869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4823, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.4917, batch_reg_loss: 0.1845, reg_loss: 0.1845 ||: 47%|####7 | 45/95 [00:19<00:21, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9676, LAS: 0.9406, UEM: 0.6992, LEM: 0.5072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1197, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4158, loss: 0.4832, batch_reg_loss: 0.1845, 
reg_loss: 0.1845 ||: 53%|#####2 | 50/95 [00:21<00:20, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9677, LAS: 0.9404, UEM: 0.6934, LEM: 0.4971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4337, partial_loss/deprel_loss: 0.3512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.4848, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||: 58%|#####7 | 55/95 [00:23<00:17, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9682, LAS: 0.9411, UEM: 0.6925, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2274, partial_loss/deprel_loss: 0.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4278, loss: 0.4807, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||: 63%|######3 | 60/95 [00:26<00:15, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9522, UAS: 0.9685, LAS: 0.9413, UEM: 0.6904, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.2075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3957, loss: 0.4787, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||: 68%|######8 | 65/95 [00:28<00:12, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9687, LAS: 0.9414, UEM: 0.6932, LEM: 0.4907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.4779, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||: 74%|#######3 | 70/95 [00:30<00:11, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9692, LAS: 0.9419, UEM: 0.6971, LEM: 
0.4931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.2595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4435, loss: 0.4745, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||: 79%|#######8 | 75/95 [00:32<00:09, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9688, LAS: 0.9415, UEM: 0.6922, LEM: 0.4883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5407, partial_loss/deprel_loss: 0.3514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.4771, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 84%|########4 | 80/95 [00:37<00:08, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9689, LAS: 0.9418, UEM: 0.7071, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5852, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6193, loss: 0.4749, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 88%|########8 | 84/95 [00:39<00:06, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9691, LAS: 0.9419, UEM: 0.7056, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5391, loss: 0.4745, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 94%|#########3| 89/95 [00:41<00:03, 1.90it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9693, LAS: 0.9421, UEM: 0.7087, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2439, partial_loss/deprel_loss: 0.2633, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.4740, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 99%|#########8| 94/95 [00:44<00:00, 1.97it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9694, LAS: 0.9422, UEM: 0.7084, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.2740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4383, loss: 0.4736, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 100%|##########| 95/95 [00:44<00:00, 2.14it/s]\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - reg_loss | 0.184 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - UEM | 0.708 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - LEM | 0.510 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EM | 0.948 | N/A\n", + "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.174 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - 
partial_loss/deprel_loss | 0.274 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - loss | 0.474 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - LAS | 0.942 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:16:25,870 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:16:29,983 - INFO - combo.training.trainer - Epoch duration: 0:00:51.396437\n", + "2023-04-07 02:16:29,983 - INFO - combo.training.trainer - Estimated training time remaining: 4:05:20\n", + "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - Epoch 183/399\n", + "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:16:29,992 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9736, LAS: 0.9450, UEM: 0.7081, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3990, loss: 0.4526, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||: 5%|5 | 5/95 [00:02<00:38, 2.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9648, LAS: 0.9359, UEM: 0.6100, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.3098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.5070, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||: 11%|# | 10/95 [00:04<00:36, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9680, LAS: 0.9394, UEM: 0.6750, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.2077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3821, loss: 0.4776, batch_reg_loss: 0.1842, reg_loss: 0.1843 ||: 16%|#5 | 15/95 [00:06<00:34, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9706, LAS: 0.9418, UEM: 0.7283, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2150, partial_loss/deprel_loss: 0.2509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4279, loss: 0.4616, batch_reg_loss: 0.1842, reg_loss: 0.1843 ||: 21%|##1 | 20/95 [00:08<00:32, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9682, LAS: 0.9397, UEM: 0.6953, LEM: 0.4727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3700, partial_loss/deprel_loss: 0.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5297, loss: 0.4773, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||: 26%|##6 | 25/95 [00:10<00:30, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9699, LAS: 0.9416, UEM: 0.7165, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0679, partial_loss/deprel_loss: 0.1659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3305, loss: 0.4651, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||: 32%|###1 | 30/95 [00:13<00:28, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9707, LAS: 0.9429, UEM: 0.7351, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2346, partial_loss/deprel_loss: 0.2264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4122, loss: 0.4562, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||: 37%|###6 | 35/95 [00:15<00:26, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9701, LAS: 0.9425, UEM: 0.7245, LEM: 0.5128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2820, partial_loss/deprel_loss: 
0.2577, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4467, loss: 0.4615, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||: 42%|####2 | 40/95 [00:17<00:24, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9694, LAS: 0.9419, UEM: 0.7106, LEM: 0.4996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4482, loss: 0.4674, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||: 47%|####7 | 45/95 [00:19<00:21, 2.27it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9702, LAS: 0.9424, UEM: 0.7154, LEM: 0.5002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1348, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.4638, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||: 53%|#####2 | 50/95 [00:21<00:19, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9709, LAS: 0.9432, UEM: 0.7288, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.2281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3880, loss: 0.4582, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||: 58%|#####7 | 55/95 [00:24<00:17, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9709, LAS: 0.9432, UEM: 0.7273, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5454, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.4585, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||: 63%|######3 | 60/95 [00:26<00:16, 
2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9709, LAS: 0.9431, UEM: 0.7266, LEM: 0.5144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0981, partial_loss/deprel_loss: 0.2148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3755, loss: 0.4597, batch_reg_loss: 0.1840, reg_loss: 0.1842 ||: 68%|######8 | 65/95 [00:28<00:13, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9707, LAS: 0.9428, UEM: 0.7228, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4872, loss: 0.4622, batch_reg_loss: 0.1840, reg_loss: 0.1842 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9700, LAS: 0.9423, UEM: 0.7160, LEM: 0.5036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.2177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3907, loss: 0.4662, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||: 79%|#######8 | 75/95 [00:33<00:09, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9697, LAS: 0.9418, UEM: 0.7115, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3087, partial_loss/deprel_loss: 0.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5112, loss: 0.4701, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||: 84%|########4 | 80/95 [00:35<00:06, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9701, LAS: 0.9424, UEM: 0.7249, LEM: 0.5196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.2391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.4662, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||: 89%|########9 | 85/95 [00:38<00:04, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9698, LAS: 0.9421, UEM: 0.7194, LEM: 0.5130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3806, partial_loss/deprel_loss: 0.3290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.4687, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||: 95%|#########4| 90/95 [00:40<00:02, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9691, LAS: 0.9415, UEM: 0.7092, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5814, loss: 0.4741, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||: 100%|##########| 95/95 [00:42<00:00, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9691, LAS: 0.9415, UEM: 0.7092, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5814, loss: 0.4741, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||: 100%|##########| 95/95 [00:42<00:00, 2.23it/s]\n", + "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - reg_loss | 0.184 | N/A\n", + "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UEM | 0.709 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - LEM | 0.504 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - EM | 0.926 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.493 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.374 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - loss | 0.474 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - LAS | 0.941 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:17:15,949 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:17:19,499 - INFO - combo.training.trainer - Epoch duration: 0:00:49.514962\n", + "2023-04-07 02:17:19,499 - INFO - combo.training.trainer - Estimated training time remaining: 4:03:50\n", + "2023-04-07 02:17:19,499 - INFO - allennlp.training.trainer - Epoch 184/399\n", + "2023-04-07 02:17:19,500 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:17:19,501 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:17:19,510 - INFO - allennlp.training.trainer - Training\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9601, UAS: 0.9756, LAS: 0.9476, UEM: 0.7727, LEM: 0.5719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0784, partial_loss/deprel_loss: 0.1610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3284, loss: 0.4333, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||: 5%|5 | 5/95 [00:02<00:37, 2.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9734, LAS: 0.9460, UEM: 0.7501, LEM: 0.5449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1814, partial_loss/deprel_loss: 0.2370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4097, loss: 0.4404, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||: 11%|# | 10/95 [00:04<00:36, 2.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9707, LAS: 0.9428, UEM: 0.7047, LEM: 0.4890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6634, partial_loss/deprel_loss: 0.4062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6415, loss: 0.4590, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||: 16%|#5 | 15/95 
[00:06<00:33, 2.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9683, LAS: 0.9406, UEM: 0.6697, LEM: 0.4599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3319, partial_loss/deprel_loss: 0.4034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.4729, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||: 21%|##1 | 20/95 [00:08<00:31, 2.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9671, LAS: 0.9396, UEM: 0.6771, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9460, partial_loss/deprel_loss: 0.4293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7165, loss: 0.4751, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||: 26%|##6 | 25/95 [00:10<00:30, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9554, UAS: 0.9685, LAS: 0.9412, UEM: 0.6890, LEM: 0.4775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1203, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3871, loss: 0.4683, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||: 33%|###2 | 31/95 [00:13<00:26, 2.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9686, LAS: 0.9412, UEM: 0.6822, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1838, partial_loss/deprel_loss: 0.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4080, loss: 0.4687, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||: 39%|###8 | 37/95 [00:15<00:23, 2.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9682, LAS: 0.9413, UEM: 0.7009, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6546, partial_loss/deprel_loss: 0.4432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6693, loss: 0.4710, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||: 44%|####4 | 42/95 [00:17<00:23, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9691, LAS: 0.9420, UEM: 0.7133, LEM: 0.5150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0854, partial_loss/deprel_loss: 0.1738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3399, loss: 0.4655, batch_reg_loss: 0.1838, reg_loss: 0.1838 ||: 49%|####9 | 47/95 [00:19<00:20, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9689, LAS: 0.9421, UEM: 0.7040, LEM: 0.5064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4696, loss: 0.4667, batch_reg_loss: 0.1838, reg_loss: 0.1838 ||: 55%|#####4 | 52/95 [00:22<00:18, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9395, UAS: 0.9690, LAS: 0.9420, UEM: 0.6976, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3717, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.4681, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 60%|###### | 57/95 [00:24<00:16, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9686, LAS: 0.9416, UEM: 0.6937, LEM: 0.4938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2831, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.4708, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 65%|######5 | 62/95 [00:26<00:14, 2.31it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9693, LAS: 0.9423, UEM: 0.7034, LEM: 0.5028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3190, partial_loss/deprel_loss: 0.2927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4817, loss: 0.4677, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 71%|####### | 67/95 [00:29<00:12, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9694, LAS: 0.9424, UEM: 0.7031, LEM: 0.5013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1532, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4181, loss: 0.4677, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 76%|#######5 | 72/95 [00:31<00:10, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9687, LAS: 0.9417, UEM: 0.6940, LEM: 0.4925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8632, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7321, loss: 0.4724, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 81%|########1 | 77/95 [00:33<00:08, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9691, LAS: 0.9420, UEM: 0.7061, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5038, partial_loss/deprel_loss: 0.3411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.4695, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||: 86%|########6 | 82/95 [00:36<00:06, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9689, LAS: 0.9418, UEM: 0.7023, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1276, partial_loss/deprel_loss: 0.2435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.4710, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||: 92%|#########1| 87/95 [00:38<00:03, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9694, LAS: 0.9423, UEM: 0.7084, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2658, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4977, loss: 0.4680, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||: 97%|#########6| 92/95 [00:40<00:01, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9697, LAS: 0.9425, UEM: 0.7121, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1267, partial_loss/deprel_loss: 0.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3864, loss: 0.4661, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||: 100%|##########| 95/95 [00:41<00:00, 2.26it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:18:04,351 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - reg_loss | 0.184 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UEM | 0.712 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - LEM | 0.511 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EM | 0.954 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.127 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.222 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - loss | 0.466 | N/A\n", + "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - LAS | 0.943 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:18:04,358 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:18:08,062 - INFO - combo.training.trainer - Epoch duration: 0:00:48.562741\n", + "2023-04-07 02:18:08,062 - INFO - combo.training.trainer - Estimated training time remaining: 4:02:20\n", + "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - Epoch 185/399\n", + "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:18:08,077 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9713, LAS: 0.9422, UEM: 0.6968, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1323, partial_loss/deprel_loss: 0.2587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4686, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||: 5%|5 | 5/95 [00:02<00:36, 2.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9733, LAS: 0.9454, UEM: 0.7769, LEM: 0.5865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4205, partial_loss/deprel_loss: 0.3167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.4507, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||: 11%|# | 10/95 [00:04<00:35, 2.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9697, LAS: 0.9426, UEM: 0.7214, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 0.2448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4124, loss: 0.4648, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||: 16%|#5 | 15/95 [00:06<00:34, 2.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9487, UAS: 0.9696, LAS: 0.9425, UEM: 0.7060, LEM: 0.5067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2376, partial_loss/deprel_loss: 0.2455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4275, loss: 0.4680, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||: 22%|##2 | 21/95 [00:08<00:30, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9693, LAS: 0.9420, UEM: 0.6909, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5075, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5418, loss: 0.4694, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||: 27%|##7 | 26/95 [00:10<00:28, 2.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9561, UAS: 0.9686, LAS: 0.9415, UEM: 0.6786, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1308, partial_loss/deprel_loss: 0.2191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3850, loss: 0.4728, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||: 33%|###2 | 31/95 [00:12<00:26, 2.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9707, LAS: 0.9434, UEM: 0.7275, LEM: 0.5268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0810, partial_loss/deprel_loss: 0.1937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3547, loss: 0.4578, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||: 38%|###7 | 36/95 [00:15<00:25, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9684, LAS: 0.9412, UEM: 0.7247, LEM: 0.5329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 
0.3145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5058, loss: 0.4714, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||: 43%|####3 | 41/95 [00:18<00:24, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9692, LAS: 0.9418, UEM: 0.7286, LEM: 0.5308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3186, partial_loss/deprel_loss: 0.3249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.4669, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||: 48%|####8 | 46/95 [00:20<00:22, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9696, LAS: 0.9421, UEM: 0.7231, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.2225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4037, loss: 0.4641, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||: 54%|#####3 | 51/95 [00:22<00:19, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9703, LAS: 0.9427, UEM: 0.7311, LEM: 0.5269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1679, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4382, loss: 0.4599, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||: 59%|#####8 | 56/95 [00:24<00:17, 2.21it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9704, LAS: 0.9428, UEM: 0.7298, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.3156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 0.4607, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||: 64%|######4 | 61/95 [00:27<00:15, 
2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9706, LAS: 0.9430, UEM: 0.7294, LEM: 0.5232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1501, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.4599, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||: 69%|######9 | 66/95 [00:29<00:13, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9701, LAS: 0.9427, UEM: 0.7242, LEM: 0.5180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2449, partial_loss/deprel_loss: 0.2433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4270, loss: 0.4618, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||: 75%|#######4 | 71/95 [00:31<00:10, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9697, LAS: 0.9422, UEM: 0.7158, LEM: 0.5097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2932, partial_loss/deprel_loss: 0.3107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.4653, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||: 80%|######## | 76/95 [00:33<00:08, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9523, UAS: 0.9698, LAS: 0.9424, UEM: 0.7206, LEM: 0.5148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1798, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3985, loss: 0.4648, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||: 85%|########5 | 81/95 [00:36<00:06, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9545, UAS: 0.9701, LAS: 0.9426, UEM: 0.7232, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1152, partial_loss/deprel_loss: 0.2238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.4649, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||: 91%|######### | 86/95 [00:38<00:04, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9697, LAS: 0.9423, UEM: 0.7164, LEM: 0.5110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5114, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.4675, batch_reg_loss: 0.1833, reg_loss: 0.1834 ||: 96%|#########5| 91/95 [00:40<00:01, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9695, LAS: 0.9421, UEM: 0.7116, LEM: 0.5053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2759, partial_loss/deprel_loss: 0.2409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4312, loss: 0.4684, batch_reg_loss: 0.1833, reg_loss: 0.1834 ||: 100%|##########| 95/95 [00:42<00:00, 2.23it/s]\n", + "2023-04-07 02:18:53,988 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9645, LAS: 0.9191, UEM: 0.7971, LEM: 0.5561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 4.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7228, loss: 5.0399, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:02<00:04, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9536, LAS: 0.9045, UEM: 0.6965, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1079, partial_loss/deprel_loss: 7.6961, partial_loss/cycle_loss: 0.0000, 
batch_loss: 6.3784, loss: 6.6649, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 73%|#######2 | 8/11 [00:05<00:01, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9526, LAS: 0.9014, UEM: 0.6878, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5696, partial_loss/deprel_loss: 6.9750, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6939, loss: 6.9893, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00, 1.57it/s]\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - reg_loss | 0.183 | 0.000\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - UEM | 0.712 | 0.688\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - LEM | 0.505 | 0.416\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EM | 0.941 | 0.899\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.276 | 0.570\n", + "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | 0.953\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.241 | 
6.975\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - loss | 0.468 | 6.989\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - LAS | 0.942 | 0.901\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:19:00,994 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:19:05,879 - INFO - combo.training.trainer - Epoch duration: 0:00:57.816087\n", + "2023-04-07 02:19:05,879 - INFO - combo.training.trainer - Estimated training time remaining: 4:01:01\n", + "2023-04-07 02:19:05,879 - INFO - allennlp.training.trainer - Epoch 186/399\n", + "2023-04-07 02:19:05,880 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:19:05,880 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:19:05,888 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9657, LAS: 0.9372, UEM: 0.6630, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1662, partial_loss/deprel_loss: 0.2648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4284, loss: 0.5067, batch_reg_loss: 0.1833, reg_loss: 0.1833 ||: 5%|5 | 5/95 [00:02<00:40, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9652, LAS: 0.9376, UEM: 0.6355, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2578, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.5016, batch_reg_loss: 0.1832, reg_loss: 0.1833 ||: 11%|# | 10/95 [00:04<00:38, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9661, LAS: 0.9395, UEM: 0.6360, LEM: 0.4271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4989, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.4916, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||: 16%|#5 | 15/95 
[00:06<00:36, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9617, UAS: 0.9693, LAS: 0.9426, UEM: 0.6979, LEM: 0.4948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1027, partial_loss/deprel_loss: 0.2005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3642, loss: 0.4722, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||: 21%|##1 | 20/95 [00:09<00:34, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9701, LAS: 0.9433, UEM: 0.6981, LEM: 0.4870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.4657, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||: 26%|##6 | 25/95 [00:11<00:31, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9691, LAS: 0.9426, UEM: 0.6975, LEM: 0.4926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6066, partial_loss/deprel_loss: 0.3537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.4675, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||: 32%|###1 | 30/95 [00:13<00:30, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9689, LAS: 0.9426, UEM: 0.6882, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3191, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5180, loss: 0.4660, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||: 37%|###6 | 35/95 [00:15<00:26, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9689, LAS: 0.9425, UEM: 0.6775, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3450, partial_loss/deprel_loss: 0.3127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5023, loss: 0.4663, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 42%|####2 | 40/95 [00:18<00:24, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9542, UAS: 0.9680, LAS: 0.9416, UEM: 0.6728, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.2079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3765, loss: 0.4703, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 47%|####7 | 45/95 [00:20<00:22, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9686, LAS: 0.9422, UEM: 0.6827, LEM: 0.4776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1947, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4214, loss: 0.4682, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 53%|#####2 | 50/95 [00:22<00:20, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9677, LAS: 0.9412, UEM: 0.6730, LEM: 0.4682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1068, partial_loss/deprel_loss: 0.2095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3721, loss: 0.4745, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 58%|#####7 | 55/95 [00:25<00:18, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9680, LAS: 0.9414, UEM: 0.6839, LEM: 0.4801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2162, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4327, loss: 0.4726, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 63%|######3 | 60/95 [00:27<00:15, 2.19it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9677, LAS: 0.9412, UEM: 0.6740, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2590, partial_loss/deprel_loss: 0.2636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.4741, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||: 68%|######8 | 65/95 [00:29<00:13, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9296, UAS: 0.9678, LAS: 0.9413, UEM: 0.6783, LEM: 0.4759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4853, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.4748, batch_reg_loss: 0.1830, reg_loss: 0.1832 ||: 74%|#######3 | 70/95 [00:32<00:11, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9683, LAS: 0.9417, UEM: 0.6893, LEM: 0.4874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3323, partial_loss/deprel_loss: 0.3248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.4712, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 79%|#######8 | 75/95 [00:34<00:09, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9690, LAS: 0.9425, UEM: 0.6999, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3904, loss: 0.4659, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 84%|########4 | 80/95 [00:36<00:06, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9694, LAS: 0.9429, UEM: 0.7109, LEM: 0.5137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.2877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.4625, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 89%|########9 | 85/95 [00:39<00:04, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9688, LAS: 0.9424, UEM: 0.7054, LEM: 0.5069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4620, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.4659, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 95%|#########4| 90/95 [00:41<00:02, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9692, LAS: 0.9427, UEM: 0.7096, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.4638, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 100%|##########| 95/95 [00:43<00:00, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9692, LAS: 0.9427, UEM: 0.7096, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.4638, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 100%|##########| 95/95 [00:43<00:00, 2.20it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - reg_loss | 0.183 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - UEM | 0.710 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - LEM | 0.509 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - EM | 0.938 | N/A\n", + "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.348 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.310 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - loss | 0.464 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - LAS | 0.943 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:19:51,743 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:19:55,738 - INFO - combo.training.trainer - Epoch duration: 0:00:49.858388\n", + "2023-04-07 02:19:55,738 - INFO - combo.training.trainer - Estimated training time remaining: 3:59:34\n", + "2023-04-07 02:19:55,738 - INFO - allennlp.training.trainer - Epoch 187/399\n", + "2023-04-07 02:19:55,738 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:19:55,739 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:19:55,746 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9738, LAS: 0.9445, UEM: 0.7373, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1277, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3987, loss: 0.4425, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||: 5%|5 | 5/95 [00:02<00:44, 2.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9701, LAS: 0.9425, UEM: 0.6734, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1659, partial_loss/deprel_loss: 0.2346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4037, loss: 0.4636, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||: 11%|# | 10/95 [00:04<00:40, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9687, LAS: 0.9405, UEM: 0.6641, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4510, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.4761, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||: 16%|#5 | 15/95 
[00:06<00:36, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9681, LAS: 0.9403, UEM: 0.6361, LEM: 0.4227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2226, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.4780, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||: 21%|##1 | 20/95 [00:08<00:33, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9676, LAS: 0.9398, UEM: 0.6648, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1633, partial_loss/deprel_loss: 0.2320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4011, loss: 0.4773, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||: 26%|##6 | 25/95 [00:11<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9700, LAS: 0.9428, UEM: 0.7328, LEM: 0.5448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1102, partial_loss/deprel_loss: 0.2185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 0.4601, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||: 32%|###1 | 30/95 [00:13<00:30, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9706, LAS: 0.9435, UEM: 0.7399, LEM: 0.5511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1414, partial_loss/deprel_loss: 0.2290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3943, loss: 0.4567, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||: 37%|###6 | 35/95 [00:15<00:27, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9550, UAS: 0.9713, LAS: 0.9441, UEM: 0.7467, LEM: 0.5537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1221, partial_loss/deprel_loss: 0.2234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3859, loss: 0.4536, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||: 42%|####2 | 40/95 [00:18<00:25, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9698, LAS: 0.9424, UEM: 0.7320, LEM: 0.5373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.4639, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||: 47%|####7 | 45/95 [00:20<00:23, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9387, UAS: 0.9692, LAS: 0.9415, UEM: 0.7200, LEM: 0.5233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.2722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4411, loss: 0.4696, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||: 53%|#####2 | 50/95 [00:22<00:20, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9697, LAS: 0.9423, UEM: 0.7238, LEM: 0.5278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.4640, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||: 58%|#####7 | 55/95 [00:25<00:18, 2.16it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9697, LAS: 0.9424, UEM: 0.7291, LEM: 0.5372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1354, partial_loss/deprel_loss: 0.2235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3886, loss: 0.4627, batch_reg_loss: 
0.1827, reg_loss: 0.1828 ||: 63%|######3 | 60/95 [00:27<00:16, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9696, LAS: 0.9423, UEM: 0.7209, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.2856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4409, loss: 0.4656, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||: 68%|######8 | 65/95 [00:29<00:13, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9699, LAS: 0.9426, UEM: 0.7262, LEM: 0.5327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0640, partial_loss/deprel_loss: 0.2180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3699, loss: 0.4637, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||: 74%|#######3 | 70/95 [00:32<00:11, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9700, LAS: 0.9426, UEM: 0.7239, LEM: 0.5272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.2182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3848, loss: 0.4625, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||: 79%|#######8 | 75/95 [00:34<00:08, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9704, LAS: 0.9430, UEM: 0.7238, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3018, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.4602, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||: 84%|########4 | 80/95 [00:36<00:06, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9702, LAS: 0.9427, UEM: 
0.7180, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4883, loss: 0.4630, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||: 91%|######### | 86/95 [00:38<00:03, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9696, LAS: 0.9422, UEM: 0.7158, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4609, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5194, loss: 0.4663, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||: 96%|#########5| 91/95 [00:40<00:01, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9692, LAS: 0.9417, UEM: 0.7090, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5085, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.4697, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||: 100%|##########| 95/95 [00:42<00:00, 2.24it/s]\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - reg_loss | 0.183 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UEM | 0.709 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - LEM | 0.509 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.508 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UAS | 0.969 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.367 | N/A\n", + "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - loss | 0.470 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - LAS | 0.942 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:20:40,927 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:20:44,479 - INFO - combo.training.trainer - Epoch duration: 0:00:48.740412\n", + "2023-04-07 02:20:44,479 - INFO - combo.training.trainer - Estimated training time remaining: 3:58:05\n", + "2023-04-07 02:20:44,479 - INFO - allennlp.training.trainer - Epoch 188/399\n", + "2023-04-07 02:20:44,480 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:20:44,481 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:20:44,491 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9801, LAS: 0.9529, UEM: 0.8096, LEM: 0.5966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2648, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.3854, batch_reg_loss: 0.1826, reg_loss: 0.1826 ||: 5%|5 | 5/95 [00:02<00:37, 2.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9742, LAS: 0.9481, UEM: 0.7212, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2372, partial_loss/deprel_loss: 0.2542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4334, loss: 0.4284, batch_reg_loss: 0.1826, reg_loss: 0.1826 ||: 11%|# | 10/95 [00:04<00:35, 2.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9751, LAS: 0.9487, UEM: 0.7435, LEM: 0.5323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.2284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4036, loss: 0.4221, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||: 16%|#5 | 15/95 [00:06<00:34, 2.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": 
"stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9750, LAS: 0.9483, UEM: 0.7447, LEM: 0.5299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1541, partial_loss/deprel_loss: 0.1990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3726, loss: 0.4249, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||: 21%|##1 | 20/95 [00:08<00:33, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9740, LAS: 0.9479, UEM: 0.7233, LEM: 0.5085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.4316, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||: 26%|##6 | 25/95 [00:10<00:30, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9734, LAS: 0.9470, UEM: 0.7199, LEM: 0.5031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1018, partial_loss/deprel_loss: 0.2249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3828, loss: 0.4370, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||: 32%|###1 | 30/95 [00:13<00:28, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9728, LAS: 0.9462, UEM: 0.7209, LEM: 0.5014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4609, loss: 0.4429, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||: 37%|###6 | 35/95 [00:15<00:26, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9717, LAS: 0.9452, UEM: 0.7065, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.2881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4731, loss: 0.4492, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||: 42%|####2 | 40/95 [00:17<00:23, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9723, LAS: 0.9455, UEM: 0.7222, LEM: 0.5056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3109, partial_loss/deprel_loss: 0.3028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.4452, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 47%|####7 | 45/95 [00:19<00:22, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9719, LAS: 0.9452, UEM: 0.7191, LEM: 0.5032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0901, partial_loss/deprel_loss: 0.2167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3738, loss: 0.4478, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 53%|#####2 | 50/95 [00:22<00:19, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9707, LAS: 0.9439, UEM: 0.7071, LEM: 0.4909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2655, partial_loss/deprel_loss: 0.3009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.4575, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 58%|#####7 | 55/95 [00:24<00:17, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9697, LAS: 0.9428, UEM: 0.6977, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2602, partial_loss/deprel_loss: 0.2986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4733, loss: 0.4643, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 63%|######3 | 60/95 [00:26<00:15, 2.22it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9696, LAS: 0.9427, UEM: 0.6931, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.3783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5776, loss: 0.4668, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 68%|######8 | 65/95 [00:28<00:13, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9698, LAS: 0.9427, UEM: 0.6992, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5744, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.4668, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9698, LAS: 0.9429, UEM: 0.7004, LEM: 0.4858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1531, partial_loss/deprel_loss: 0.2386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.4653, batch_reg_loss: 0.1823, reg_loss: 0.1825 ||: 79%|#######8 | 75/95 [00:33<00:09, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9692, LAS: 0.9423, UEM: 0.6951, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5602, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.4688, batch_reg_loss: 0.1823, reg_loss: 0.1825 ||: 84%|########4 | 80/95 [00:36<00:07, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9699, LAS: 0.9431, UEM: 0.7190, LEM: 0.5157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0234, partial_loss/deprel_loss: 0.1003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2672, loss: 0.4637, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 89%|########9 | 85/95 [00:38<00:04, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9700, LAS: 0.9432, UEM: 0.7213, LEM: 0.5185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0915, partial_loss/deprel_loss: 0.1827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3468, loss: 0.4623, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 95%|#########4| 90/95 [00:40<00:02, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9697, LAS: 0.9429, UEM: 0.7152, LEM: 0.5121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.4639, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 100%|##########| 95/95 [00:42<00:00, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9697, LAS: 0.9429, UEM: 0.7152, LEM: 0.5121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.4639, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 100%|##########| 95/95 [00:42<00:00, 2.21it/s]\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - reg_loss | 0.182 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - UEM | 0.715 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - LEM | 0.512 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - EM | 0.934 | N/A\n", + "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.426 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.344 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - loss | 0.464 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - LAS | 0.943 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:21:30,463 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:21:34,372 - INFO - combo.training.trainer - Epoch duration: 0:00:49.892762\n", + "2023-04-07 02:21:34,372 - INFO - combo.training.trainer - Estimated training time remaining: 3:56:38\n", + "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - Epoch 189/399\n", + "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:21:34,382 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9734, LAS: 0.9445, UEM: 0.7078, LEM: 0.4754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.1919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3572, loss: 0.4531, batch_reg_loss: 0.1823, reg_loss: 0.1823 ||: 5%|5 | 5/95 [00:02<00:37, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9699, LAS: 0.9423, UEM: 0.6860, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4790, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5628, loss: 0.4679, batch_reg_loss: 0.1822, reg_loss: 0.1823 ||: 12%|#1 | 11/95 [00:04<00:34, 2.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9651, LAS: 0.9384, UEM: 0.6247, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8505, partial_loss/deprel_loss: 0.4051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6764, loss: 0.4925, batch_reg_loss: 0.1822, reg_loss: 0.1823 ||: 17%|#6 | 16/95 
[00:06<00:32, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9659, LAS: 0.9389, UEM: 0.6478, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1255, partial_loss/deprel_loss: 0.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3679, loss: 0.4855, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||: 22%|##2 | 21/95 [00:09<00:32, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9671, LAS: 0.9400, UEM: 0.6776, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.4797, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||: 27%|##7 | 26/95 [00:11<00:30, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9684, LAS: 0.9412, UEM: 0.7049, LEM: 0.4990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1352, partial_loss/deprel_loss: 0.2439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.4711, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||: 33%|###2 | 31/95 [00:13<00:29, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9439, UAS: 0.9696, LAS: 0.9427, UEM: 0.7321, LEM: 0.5369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2710, partial_loss/deprel_loss: 0.2446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4321, loss: 0.4622, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||: 38%|###7 | 36/95 [00:16<00:27, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9507, UAS: 0.9686, LAS: 0.9421, UEM: 0.7178, LEM: 0.5225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.2257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4049, loss: 0.4658, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||: 43%|####3 | 41/95 [00:18<00:24, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9681, LAS: 0.9415, UEM: 0.7043, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3203, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4757, loss: 0.4691, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||: 48%|####8 | 46/95 [00:20<00:22, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9561, UAS: 0.9690, LAS: 0.9422, UEM: 0.7141, LEM: 0.5133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1231, partial_loss/deprel_loss: 0.1746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3464, loss: 0.4630, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||: 55%|#####4 | 52/95 [00:23<00:18, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9700, LAS: 0.9431, UEM: 0.7255, LEM: 0.5227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.3428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5122, loss: 0.4575, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||: 61%|######1 | 58/95 [00:25<00:15, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9706, LAS: 0.9436, UEM: 0.7270, LEM: 0.5214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1552, partial_loss/deprel_loss: 0.2337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, loss: 0.4545, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||: 66%|######6 | 63/95 [00:27<00:13, 
2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9585, UAS: 0.9705, LAS: 0.9436, UEM: 0.7209, LEM: 0.5134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1139, partial_loss/deprel_loss: 0.2043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3683, loss: 0.4561, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||: 72%|#######1 | 68/95 [00:29<00:11, 2.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9705, LAS: 0.9435, UEM: 0.7166, LEM: 0.5079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2353, partial_loss/deprel_loss: 0.2779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4514, loss: 0.4572, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||: 77%|#######6 | 73/95 [00:31<00:09, 2.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9701, LAS: 0.9430, UEM: 0.7112, LEM: 0.5012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1620, partial_loss/deprel_loss: 0.2726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4325, loss: 0.4609, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||: 82%|########2 | 78/95 [00:33<00:07, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9704, LAS: 0.9434, UEM: 0.7200, LEM: 0.5111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4983, loss: 0.4580, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||: 87%|########7 | 83/95 [00:36<00:05, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9706, LAS: 0.9435, UEM: 0.7200, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.2367, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4287, loss: 0.4566, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||: 93%|#########2| 88/95 [00:38<00:03, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9702, LAS: 0.9431, UEM: 0.7186, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8426, partial_loss/deprel_loss: 0.4660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7233, loss: 0.4596, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||: 98%|#########7| 93/95 [00:41<00:00, 2.16it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9704, LAS: 0.9433, UEM: 0.7191, LEM: 0.5098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3867, loss: 0.4587, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||: 100%|##########| 95/95 [00:41<00:00, 2.27it/s]\n", + "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - reg_loss | 0.182 | N/A\n", + "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UEM | 0.719 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LEM | 0.510 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - EM | 0.951 | N/A\n", + "2023-04-07 02:22:19,519 - 
INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.198 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.206 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - loss | 0.459 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LAS | 0.943 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:22:19,526 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:22:23,753 - INFO - combo.training.trainer - Epoch duration: 0:00:49.380132\n", + "2023-04-07 02:22:23,753 - INFO - combo.training.trainer - Estimated training time remaining: 3:55:11\n", + "2023-04-07 02:22:23,754 - INFO - allennlp.training.trainer - Epoch 190/399\n", + "2023-04-07 02:22:23,754 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:22:23,755 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:22:23,765 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9683, LAS: 0.9431, UEM: 0.6156, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1820, partial_loss/deprel_loss: 0.2421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4121, loss: 0.4673, batch_reg_loss: 0.1820, reg_loss: 0.1820 ||: 5%|5 | 5/95 [00:02<00:39, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9722, LAS: 0.9465, UEM: 0.7104, LEM: 0.4901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1259, partial_loss/deprel_loss: 0.2186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3820, loss: 0.4511, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 11%|# | 10/95 [00:04<00:38, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9674, LAS: 0.9419, UEM: 0.6680, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4621, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.4839, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 15%|#4 | 14/95 [00:06<00:37, 2.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9697, LAS: 0.9430, UEM: 0.7076, LEM: 0.4921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2136, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4147, loss: 0.4676, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 20%|## | 19/95 [00:08<00:34, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9694, LAS: 0.9427, UEM: 0.6963, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4350, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5418, loss: 0.4686, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 25%|##5 | 24/95 [00:10<00:31, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9601, UAS: 0.9705, LAS: 0.9440, UEM: 0.7347, LEM: 0.5340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0790, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3549, loss: 0.4606, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 29%|##9 | 28/95 [00:12<00:31, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9705, LAS: 0.9440, UEM: 0.7253, LEM: 0.5191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2995, partial_loss/deprel_loss: 0.2734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4621, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||: 35%|###4 | 33/95 [00:15<00:28, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9697, LAS: 0.9433, UEM: 0.7059, LEM: 0.4992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2593, partial_loss/deprel_loss: 0.2728, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.4638, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 40%|#### | 38/95 [00:17<00:26, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9704, LAS: 0.9442, UEM: 0.7282, LEM: 0.5355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3659, partial_loss/deprel_loss: 0.2750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4750, loss: 0.4565, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 45%|####5 | 43/95 [00:19<00:24, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9698, LAS: 0.9438, UEM: 0.7174, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.4600, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 51%|##### | 48/95 [00:21<00:21, 2.18it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9701, LAS: 0.9439, UEM: 0.7219, LEM: 0.5263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3302, partial_loss/deprel_loss: 0.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4811, loss: 0.4571, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 56%|#####5 | 53/95 [00:24<00:19, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9704, LAS: 0.9441, UEM: 0.7257, LEM: 0.5294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1361, partial_loss/deprel_loss: 0.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3964, loss: 0.4548, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 61%|######1 | 58/95 [00:26<00:16, 2.21it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9708, LAS: 0.9445, UEM: 0.7259, LEM: 0.5276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1945, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.4531, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||: 66%|######6 | 63/95 [00:28<00:14, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9531, UAS: 0.9708, LAS: 0.9444, UEM: 0.7213, LEM: 0.5212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1591, partial_loss/deprel_loss: 0.2158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3862, loss: 0.4532, batch_reg_loss: 0.1817, reg_loss: 0.1819 ||: 72%|#######1 | 68/95 [00:30<00:12, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9708, LAS: 0.9443, UEM: 0.7210, LEM: 0.5207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1151, partial_loss/deprel_loss: 0.2258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.4537, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||: 77%|#######6 | 73/95 [00:33<00:09, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9708, LAS: 0.9442, UEM: 0.7237, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.2541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4278, loss: 0.4542, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||: 82%|########2 | 78/95 [00:35<00:07, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9702, LAS: 0.9438, UEM: 0.7130, LEM: 0.5141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4817, loss: 0.4579, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||: 87%|########7 | 83/95 [00:37<00:05, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9699, LAS: 0.9435, UEM: 0.7117, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7758, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.4598, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||: 93%|#########2| 88/95 [00:39<00:03, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9696, LAS: 0.9432, UEM: 0.7087, LEM: 0.5072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4431, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5639, loss: 0.4626, batch_reg_loss: 0.1816, reg_loss: 0.1818 ||: 99%|#########8| 94/95 [00:42<00:00, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9697, LAS: 0.9432, UEM: 0.7116, LEM: 0.5106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1498, partial_loss/deprel_loss: 0.2243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.4619, batch_reg_loss: 0.1816, reg_loss: 0.1818 ||: 100%|##########| 95/95 [00:42<00:00, 2.21it/s]\n", + "2023-04-07 02:23:09,717 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8558, UAS: 0.9366, LAS: 0.8829, UEM: 0.5207, LEM: 0.2590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6660, partial_loss/deprel_loss: 15.5290, partial_loss/cycle_loss: 0.0000, 
batch_loss: 12.7564, loss: 9.2649, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 27%|##7 | 3/11 [00:02<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9520, LAS: 0.9041, UEM: 0.7383, LEM: 0.4969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0763, partial_loss/deprel_loss: 7.6127, partial_loss/cycle_loss: 0.0000, batch_loss: 6.3054, loss: 6.6328, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:04<00:02, 1.48it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9520, LAS: 0.9007, UEM: 0.6888, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 8.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9736, loss: 6.7944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9520, LAS: 0.9007, UEM: 0.6888, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 8.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9736, loss: 6.7944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00, 1.59it/s]\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - reg_loss | 0.182 | 0.000\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 02:23:16,654 - INFO - 
combo.training.tensorboard_writer - UEM | 0.712 | 0.689\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - LEM | 0.511 | 0.416\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EM | 0.950 | 0.894\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.150 | 0.963\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | 0.952\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.224 | 8.476\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - loss | 0.462 | 6.794\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - LAS | 0.943 | 0.901\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:23:16,659 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:23:21,377 - INFO - combo.training.trainer - Epoch duration: 0:00:57.623587\n", + "2023-04-07 02:23:21,378 - INFO - combo.training.trainer - Estimated training time remaining: 3:53:53\n", + "2023-04-07 02:23:21,378 - INFO - allennlp.training.trainer - Epoch 191/399\n", + "2023-04-07 02:23:21,378 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:23:21,379 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:23:21,387 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9762, LAS: 0.9530, UEM: 0.8104, LEM: 0.6826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.4168, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||: 5%|5 | 5/95 [00:02<00:43, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9546, UAS: 0.9707, LAS: 0.9478, UEM: 0.7378, LEM: 0.5919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1372, partial_loss/deprel_loss: 0.2182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3836, loss: 0.4425, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||: 11%|# | 10/95 [00:04<00:40, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9730, LAS: 0.9487, UEM: 0.7628, LEM: 0.5917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1339, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4015, loss: 0.4341, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||: 16%|#5 | 15/95 
[00:06<00:36, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9723, LAS: 0.9473, UEM: 0.7500, LEM: 0.5666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.4364, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||: 21%|##1 | 20/95 [00:09<00:35, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9455, UAS: 0.9718, LAS: 0.9467, UEM: 0.7363, LEM: 0.5494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2069, partial_loss/deprel_loss: 0.3008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4636, loss: 0.4407, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||: 26%|##6 | 25/95 [00:11<00:32, 2.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9727, LAS: 0.9474, UEM: 0.7427, LEM: 0.5499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4354, loss: 0.4369, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||: 32%|###1 | 30/95 [00:13<00:28, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9709, LAS: 0.9456, UEM: 0.7265, LEM: 0.5331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6162, loss: 0.4465, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||: 37%|###6 | 35/95 [00:15<00:26, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9701, LAS: 0.9450, UEM: 0.7112, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.2685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4572, loss: 0.4508, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||: 43%|####3 | 41/95 [00:18<00:22, 2.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9503, UAS: 0.9708, LAS: 0.9456, UEM: 0.7304, LEM: 0.5394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2075, partial_loss/deprel_loss: 0.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4317, loss: 0.4471, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||: 48%|####8 | 46/95 [00:20<00:21, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9708, LAS: 0.9457, UEM: 0.7308, LEM: 0.5406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0844, partial_loss/deprel_loss: 0.1644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3299, loss: 0.4468, batch_reg_loss: 0.1815, reg_loss: 0.1815 ||: 54%|#####3 | 51/95 [00:22<00:19, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9709, LAS: 0.9458, UEM: 0.7358, LEM: 0.5494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.3087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.4456, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||: 59%|#####8 | 56/95 [00:24<00:17, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9710, LAS: 0.9459, UEM: 0.7306, LEM: 0.5424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2881, partial_loss/deprel_loss: 0.3186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.4462, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||: 64%|######4 | 61/95 [00:27<00:15, 2.26it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9552, UAS: 0.9711, LAS: 0.9460, UEM: 0.7318, LEM: 0.5432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1279, partial_loss/deprel_loss: 0.2277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3891, loss: 0.4458, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||: 69%|######9 | 66/95 [00:29<00:12, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9712, LAS: 0.9460, UEM: 0.7271, LEM: 0.5366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3800, partial_loss/deprel_loss: 0.3084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5041, loss: 0.4449, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||: 75%|#######4 | 71/95 [00:31<00:10, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9539, UAS: 0.9709, LAS: 0.9455, UEM: 0.7214, LEM: 0.5291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.4481, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||: 80%|######## | 76/95 [00:33<00:08, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9463, UAS: 0.9710, LAS: 0.9455, UEM: 0.7300, LEM: 0.5386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2097, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4535, loss: 0.4480, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||: 85%|########5 | 81/95 [00:36<00:06, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9708, LAS: 0.9452, UEM: 0.7248, LEM: 0.5333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6504, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6334, loss: 0.4495, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||: 91%|######### | 86/95 [00:38<00:04, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9703, LAS: 0.9448, UEM: 0.7224, LEM: 0.5305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8756, partial_loss/deprel_loss: 0.3987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.4529, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||: 96%|#########5| 91/95 [00:41<00:01, 2.14it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9700, LAS: 0.9445, UEM: 0.7157, LEM: 0.5243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.3561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.4553, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||: 100%|##########| 95/95 [00:42<00:00, 2.22it/s]\n", + "2023-04-07 02:24:07,237 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - reg_loss | 0.181 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UEM | 0.716 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - LEM | 0.524 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EM | 0.930 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 0.431 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.356 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - loss | 0.455 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - LAS | 0.944 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:07,245 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:24:10,763 - INFO - combo.training.trainer - Epoch duration: 0:00:49.385025\n", + "2023-04-07 02:24:10,763 - INFO - combo.training.trainer - Estimated training time remaining: 3:52:27\n", + "2023-04-07 02:24:10,763 - INFO - allennlp.training.trainer - Epoch 192/399\n", + "2023-04-07 02:24:10,764 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:24:10,764 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:24:10,773 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9789, LAS: 0.9571, UEM: 0.8140, LEM: 0.6628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.1925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3687, loss: 0.3693, batch_reg_loss: 0.1813, reg_loss: 0.1813 ||: 5%|5 | 5/95 [00:02<00:40, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9768, LAS: 0.9515, UEM: 0.7751, LEM: 0.5848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1505, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4325, loss: 0.3985, batch_reg_loss: 0.1813, reg_loss: 0.1813 ||: 11%|# | 10/95 [00:04<00:37, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9755, LAS: 0.9494, UEM: 0.7461, LEM: 0.5409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.2681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4671, loss: 0.4175, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||: 16%|#5 | 15/95 [00:06<00:35, 2.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9706, LAS: 0.9449, UEM: 0.6997, LEM: 0.5008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5681, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.4494, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||: 21%|##1 | 20/95 [00:08<00:32, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9695, LAS: 0.9437, UEM: 0.6775, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3712, loss: 0.4588, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||: 26%|##6 | 25/95 [00:10<00:30, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9399, UAS: 0.9710, LAS: 0.9448, UEM: 0.7127, LEM: 0.5073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3621, partial_loss/deprel_loss: 0.3050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.4494, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||: 32%|###1 | 30/95 [00:13<00:28, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9696, LAS: 0.9436, UEM: 0.6882, LEM: 0.4838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.4580, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||: 37%|###6 | 35/95 [00:15<00:27, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9696, LAS: 0.9434, UEM: 0.6808, LEM: 0.4750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3107, partial_loss/deprel_loss: 
0.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4677, loss: 0.4592, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||: 42%|####2 | 40/95 [00:17<00:24, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9701, LAS: 0.9441, UEM: 0.6826, LEM: 0.4732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.2073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3882, loss: 0.4544, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||: 47%|####7 | 45/95 [00:19<00:22, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9690, LAS: 0.9429, UEM: 0.6746, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7076, partial_loss/deprel_loss: 0.3990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6418, loss: 0.4621, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 53%|#####2 | 50/95 [00:22<00:20, 2.17it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9628, UAS: 0.9695, LAS: 0.9435, UEM: 0.6949, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0965, partial_loss/deprel_loss: 0.1971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3581, loss: 0.4580, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 58%|#####7 | 55/95 [00:24<00:18, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9772, UAS: 0.9699, LAS: 0.9442, UEM: 0.7150, LEM: 0.5234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0246, partial_loss/deprel_loss: 0.0824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2520, loss: 0.4537, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 63%|######3 | 60/95 [00:27<00:16, 
2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9705, LAS: 0.9448, UEM: 0.7184, LEM: 0.5227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.2958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4589, loss: 0.4506, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 68%|######8 | 65/95 [00:29<00:13, 2.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9705, LAS: 0.9448, UEM: 0.7193, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5896, partial_loss/deprel_loss: 0.3207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.4494, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 74%|#######3 | 70/95 [00:31<00:11, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9704, LAS: 0.9447, UEM: 0.7176, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1456, partial_loss/deprel_loss: 0.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4338, loss: 0.4503, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||: 79%|#######8 | 75/95 [00:33<00:09, 2.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9702, LAS: 0.9445, UEM: 0.7141, LEM: 0.5192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1663, partial_loss/deprel_loss: 0.2351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4024, loss: 0.4520, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||: 84%|########4 | 80/95 [00:36<00:06, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9522, UAS: 0.9703, LAS: 0.9446, UEM: 0.7100, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4226, loss: 0.4517, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||: 89%|########9 | 85/95 [00:38<00:04, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9703, LAS: 0.9445, UEM: 0.7135, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1958, partial_loss/deprel_loss: 0.2959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4569, loss: 0.4512, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||: 95%|#########4| 90/95 [00:40<00:02, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9705, LAS: 0.9447, UEM: 0.7152, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3115, partial_loss/deprel_loss: 0.2870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.4505, batch_reg_loss: 0.1810, reg_loss: 0.1811 ||: 100%|##########| 95/95 [00:42<00:00, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9705, LAS: 0.9447, UEM: 0.7152, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3115, partial_loss/deprel_loss: 0.2870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.4505, batch_reg_loss: 0.1810, reg_loss: 0.1811 ||: 100%|##########| 95/95 [00:42<00:00, 2.24it/s]\n", + "2023-04-07 02:24:55,870 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:24:55,870 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - reg_loss | 0.181 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UEM | 0.715 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LEM | 0.519 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - EM | 0.945 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.311 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UAS | 0.971 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.287 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - loss | 0.450 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LAS | 0.945 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:24:55,876 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:24:59,808 - INFO - combo.training.trainer - Epoch duration: 0:00:49.044927\n", + "2023-04-07 02:24:59,809 - INFO - combo.training.trainer - Estimated training time remaining: 3:51:01\n", + "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - Epoch 193/399\n", + "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:24:59,816 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9712, LAS: 0.9460, UEM: 0.6768, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1532, partial_loss/deprel_loss: 0.1918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3650, loss: 0.4546, batch_reg_loss: 0.1810, reg_loss: 0.1810 ||: 5%|5 | 5/95 [00:02<00:37, 2.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9743, LAS: 0.9499, UEM: 0.7249, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1009, partial_loss/deprel_loss: 0.1800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3451, loss: 0.4308, batch_reg_loss: 0.1809, reg_loss: 0.1810 ||: 12%|#1 | 11/95 [00:04<00:34, 2.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9751, LAS: 0.9503, UEM: 0.7506, LEM: 0.5484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2127, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4513, loss: 0.4221, batch_reg_loss: 0.1809, reg_loss: 0.1810 ||: 17%|#6 | 16/95 
[00:06<00:33, 2.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9543, UAS: 0.9744, LAS: 0.9492, UEM: 0.7438, LEM: 0.5364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4066, loss: 0.4259, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||: 22%|##2 | 21/95 [00:08<00:31, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9750, LAS: 0.9494, UEM: 0.7493, LEM: 0.5388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2943, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.4243, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||: 27%|##7 | 26/95 [00:11<00:29, 2.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9720, LAS: 0.9467, UEM: 0.7135, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4501, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.4414, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||: 33%|###2 | 31/95 [00:13<00:27, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9707, LAS: 0.9454, UEM: 0.6946, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2969, partial_loss/deprel_loss: 0.3191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4955, loss: 0.4463, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 38%|###7 | 36/95 [00:15<00:25, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9716, LAS: 0.9462, UEM: 0.7253, LEM: 0.5326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2574, partial_loss/deprel_loss: 0.2802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4565, loss: 0.4415, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 43%|####3 | 41/95 [00:18<00:24, 2.19it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9716, LAS: 0.9461, UEM: 0.7216, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.2556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4291, loss: 0.4434, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 48%|####8 | 46/95 [00:20<00:21, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9709, LAS: 0.9453, UEM: 0.7201, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.2232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.4483, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 54%|#####3 | 51/95 [00:22<00:20, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9491, UAS: 0.9708, LAS: 0.9452, UEM: 0.7142, LEM: 0.5176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.4499, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 59%|#####8 | 56/95 [00:25<00:18, 2.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9702, LAS: 0.9444, UEM: 0.7056, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.2712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4542, loss: 0.4541, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 64%|######4 | 61/95 [00:27<00:15, 2.18it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9463, UAS: 0.9708, LAS: 0.9450, UEM: 0.7201, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2971, partial_loss/deprel_loss: 0.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.4490, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||: 69%|######9 | 66/95 [00:29<00:13, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9711, LAS: 0.9454, UEM: 0.7264, LEM: 0.5341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4482, loss: 0.4458, batch_reg_loss: 0.1807, reg_loss: 0.1809 ||: 75%|#######4 | 71/95 [00:34<00:14, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9713, LAS: 0.9456, UEM: 0.7259, LEM: 0.5322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4021, loss: 0.4462, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 80%|######## | 76/95 [00:36<00:10, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9706, LAS: 0.9448, UEM: 0.7206, LEM: 0.5273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8308, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7229, loss: 0.4521, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 85%|########5 | 81/95 [00:38<00:07, 1.93it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9705, LAS: 0.9447, UEM: 0.7170, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0917, partial_loss/deprel_loss: 0.2132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3696, loss: 0.4528, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 91%|######### | 86/95 [00:40<00:04, 2.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9710, LAS: 0.9451, UEM: 0.7263, LEM: 0.5314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0982, partial_loss/deprel_loss: 0.1860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3491, loss: 0.4496, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 96%|#########5| 91/95 [00:43<00:01, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9379, UAS: 0.9704, LAS: 0.9445, UEM: 0.7170, LEM: 0.5231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5476, partial_loss/deprel_loss: 0.3039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5333, loss: 0.4536, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 100%|##########| 95/95 [00:45<00:00, 2.11it/s]\n", + "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - reg_loss | 0.181 | N/A\n", + "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UEM | 0.717 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LEM | 0.523 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - EM | 0.938 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.548 | N/A\n", 
+ "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.304 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - loss | 0.454 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LAS | 0.945 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:25:47,754 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:25:47,754 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:25:47,758 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:25:52,111 - INFO - combo.training.trainer - Epoch duration: 0:00:52.302130\n", + "2023-04-07 02:25:52,111 - INFO - combo.training.trainer - Estimated training time remaining: 3:49:38\n", + "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - Epoch 194/399\n", + "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:25:52,121 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9784, UAS: 0.9727, LAS: 0.9475, UEM: 0.8671, LEM: 0.7463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0226, partial_loss/deprel_loss: 0.0932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2598, loss: 0.4254, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 4%|4 | 4/95 [00:02<00:46, 1.97it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9729, LAS: 0.9472, UEM: 0.8300, LEM: 0.6810, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0788, partial_loss/deprel_loss: 0.1887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3473, loss: 0.4168, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 9%|9 | 9/95 [00:04<00:42, 2.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9737, LAS: 0.9473, UEM: 0.7973, LEM: 0.6318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3108, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5310, loss: 0.4248, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 15%|#4 | 14/95 
[00:06<00:38, 2.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9531, UAS: 0.9739, LAS: 0.9478, UEM: 0.7835, LEM: 0.6102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.2080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3785, loss: 0.4242, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 20%|## | 19/95 [00:08<00:36, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9668, UAS: 0.9741, LAS: 0.9482, UEM: 0.7857, LEM: 0.6130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0600, partial_loss/deprel_loss: 0.1196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2882, loss: 0.4240, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 25%|##5 | 24/95 [00:11<00:34, 2.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9724, LAS: 0.9465, UEM: 0.7654, LEM: 0.5906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.4365, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||: 31%|### | 29/95 [00:13<00:31, 2.12it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9725, LAS: 0.9466, UEM: 0.7548, LEM: 0.5730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2552, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.4383, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||: 37%|###6 | 35/95 [00:15<00:26, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9720, LAS: 0.9462, UEM: 0.7437, LEM: 0.5612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2174, partial_loss/deprel_loss: 0.2386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.4398, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||: 42%|####2 | 40/95 [00:18<00:24, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9708, LAS: 0.9450, UEM: 0.7368, LEM: 0.5538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8662, partial_loss/deprel_loss: 0.4060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6785, loss: 0.4482, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||: 47%|####7 | 45/95 [00:20<00:22, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9700, LAS: 0.9442, UEM: 0.7249, LEM: 0.5406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6876, partial_loss/deprel_loss: 0.3537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6009, loss: 0.4535, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||: 53%|#####2 | 50/95 [00:22<00:19, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9699, LAS: 0.9442, UEM: 0.7165, LEM: 0.5298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4022, partial_loss/deprel_loss: 0.3170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.4529, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||: 58%|#####7 | 55/95 [00:24<00:17, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9699, LAS: 0.9441, UEM: 0.7215, LEM: 0.5327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6227, partial_loss/deprel_loss: 0.3280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5674, loss: 0.4533, batch_reg_loss: 0.1805, reg_loss: 0.1805 ||: 63%|######3 | 60/95 [00:26<00:15, 2.27it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9702, LAS: 0.9444, UEM: 0.7187, LEM: 0.5262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0994, partial_loss/deprel_loss: 0.2168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3737, loss: 0.4522, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 68%|######8 | 65/95 [00:28<00:12, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9702, LAS: 0.9444, UEM: 0.7136, LEM: 0.5193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4027, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5431, loss: 0.4520, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 74%|#######3 | 70/95 [00:31<00:10, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9702, LAS: 0.9442, UEM: 0.7087, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1623, partial_loss/deprel_loss: 0.2495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4125, loss: 0.4532, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 79%|#######8 | 75/95 [00:33<00:08, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9700, LAS: 0.9440, UEM: 0.7087, LEM: 0.5108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2324, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3931, loss: 0.4542, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 84%|########4 | 80/95 [00:35<00:06, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9700, LAS: 0.9437, UEM: 0.7158, LEM: 0.5179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6074, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5768, loss: 0.4542, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 89%|########9 | 85/95 [00:37<00:04, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9704, LAS: 0.9442, UEM: 0.7185, LEM: 0.5193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2901, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.4521, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||: 95%|#########4| 90/95 [00:39<00:02, 2.27it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9706, LAS: 0.9443, UEM: 0.7174, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.4508, batch_reg_loss: 0.1803, reg_loss: 0.1805 ||: 100%|##########| 95/95 [00:42<00:00, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9706, LAS: 0.9443, UEM: 0.7174, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.4508, batch_reg_loss: 0.1803, reg_loss: 0.1805 ||: 100%|##########| 95/95 [00:42<00:00, 2.26it/s]\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - reg_loss | 0.180 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UEM | 0.717 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - LEM | 0.516 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - EM | 0.949 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.172 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UAS | 0.971 | N/A\n", + "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.230 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - loss | 0.451 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - LAS | 0.944 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 02:26:36,889 - 
INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n", + "2023-04-07 02:26:41,701 - INFO - combo.training.trainer - Epoch duration: 0:00:49.589770\n", + "2023-04-07 02:26:41,702 - INFO - combo.training.trainer - Estimated training time remaining: 3:48:13\n", + "2023-04-07 02:26:41,702 - INFO - allennlp.training.trainer - Epoch 195/399\n", + "2023-04-07 02:26:41,702 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:26:41,703 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:26:41,710 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9720, LAS: 0.9488, UEM: 0.6780, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2827, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.4437, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||: 5%|5 | 5/95 [00:02<00:38, 2.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9784, LAS: 0.9557, UEM: 0.8436, LEM: 0.6916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1188, partial_loss/deprel_loss: 0.1871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3538, loss: 0.3926, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||: 9%|9 | 9/95 [00:04<00:38, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9762, LAS: 0.9520, UEM: 0.8126, LEM: 0.6409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4186, loss: 0.4159, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||: 15%|#4 | 14/95 
[00:06<00:36, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9743, LAS: 0.9495, UEM: 0.7793, LEM: 0.6013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4681, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.4299, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||: 20%|## | 19/95 [00:08<00:34, 2.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9711, LAS: 0.9466, UEM: 0.7379, LEM: 0.5623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.2368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.4462, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||: 25%|##5 | 24/95 [00:10<00:31, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9395, UAS: 0.9702, LAS: 0.9454, UEM: 0.7296, LEM: 0.5485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2643, partial_loss/deprel_loss: 0.2978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4713, loss: 0.4505, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||: 31%|### | 29/95 [00:13<00:29, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9701, LAS: 0.9452, UEM: 0.7177, LEM: 0.5304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4225, loss: 0.4506, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||: 36%|###5 | 34/95 [00:15<00:26, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9700, LAS: 0.9451, UEM: 0.7127, LEM: 0.5224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4534, partial_loss/deprel_loss: 0.3090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5181, loss: 0.4517, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||: 41%|####1 | 39/95 [00:17<00:24, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9705, LAS: 0.9453, UEM: 0.7117, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2453, partial_loss/deprel_loss: 0.2147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4010, loss: 0.4485, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||: 46%|####6 | 44/95 [00:19<00:22, 2.23it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9692, LAS: 0.9440, UEM: 0.7051, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1320, partial_loss/deprel_loss: 0.1871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3562, loss: 0.4569, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||: 52%|#####1 | 49/95 [00:22<00:21, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9700, LAS: 0.9451, UEM: 0.7170, LEM: 0.5275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.2490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4358, loss: 0.4512, batch_reg_loss: 0.1802, reg_loss: 0.1802 ||: 57%|#####6 | 54/95 [00:24<00:19, 2.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9483, UAS: 0.9699, LAS: 0.9451, UEM: 0.7076, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3030, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4647, loss: 0.4522, batch_reg_loss: 
0.1801, reg_loss: 0.1802 ||: 63%|######3 | 60/95 [00:27<00:15, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9703, LAS: 0.9453, UEM: 0.7074, LEM: 0.5125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0932, partial_loss/deprel_loss: 0.1992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3581, loss: 0.4512, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||: 68%|######8 | 65/95 [00:29<00:13, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9641, UAS: 0.9701, LAS: 0.9452, UEM: 0.7060, LEM: 0.5122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0897, partial_loss/deprel_loss: 0.1406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3105, loss: 0.4523, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||: 74%|#######3 | 70/95 [00:31<00:10, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9703, LAS: 0.9452, UEM: 0.7059, LEM: 0.5089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.4509, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||: 79%|#######8 | 75/95 [00:33<00:08, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9475, UAS: 0.9696, LAS: 0.9444, UEM: 0.6974, LEM: 0.5001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.2326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4040, loss: 0.4551, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||: 84%|########4 | 80/95 [00:35<00:06, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9699, LAS: 0.9447, UEM: 
0.7109, LEM: 0.5164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0795, partial_loss/deprel_loss: 0.1642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3273, loss: 0.4524, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||: 89%|########9 | 85/95 [00:38<00:04, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9697, LAS: 0.9445, UEM: 0.7068, LEM: 0.5130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1100, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3663, loss: 0.4535, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||: 95%|#########4| 90/95 [00:40<00:02, 2.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9702, LAS: 0.9449, UEM: 0.7149, LEM: 0.5209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0860, partial_loss/deprel_loss: 0.1579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.4497, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||: 100%|##########| 95/95 [00:42<00:00, 2.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9702, LAS: 0.9449, UEM: 0.7149, LEM: 0.5209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0860, partial_loss/deprel_loss: 0.1579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.4497, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||: 100%|##########| 95/95 [00:42<00:00, 2.23it/s]\n", + "2023-04-07 02:27:27,488 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/11 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9532, LAS: 0.9049, UEM: 0.6861, LEM: 0.4048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4058, partial_loss/deprel_loss: 6.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3561, loss: 6.3438, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 36%|###6 | 4/11 [00:02<00:04, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9536, LAS: 0.9068, UEM: 0.7453, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5532, partial_loss/deprel_loss: 15.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 12.7731, loss: 6.6323, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 64%|######3 | 7/11 [00:04<00:02, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9531, LAS: 0.9027, UEM: 0.6908, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5501, partial_loss/deprel_loss: 6.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5948, loss: 6.8042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.55it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9531, LAS: 0.9027, UEM: 0.6908, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5501, partial_loss/deprel_loss: 6.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5948, loss: 6.8042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00, 1.54it/s]\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - reg_loss | 0.180 | 0.000\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer 
- EUEM | 0.000 | 0.000\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UEM | 0.715 | 0.691\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - LEM | 0.521 | 0.418\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - EM | 0.957 | 0.903\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.086 | 0.550\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UAS | 0.970 | 0.953\n", + "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6955.898 | N/A\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.158 | 6.856\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - loss | 0.450 | 6.804\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - LAS | 0.945 | 0.903\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2426.041 | N/A\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 02:27:34,651 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlp867qpopk/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 02:27:38,944 - INFO - combo.training.trainer - Epoch duration: 0:00:57.242174\n", + "2023-04-07 02:27:38,945 - INFO - combo.training.trainer - Estimated training time remaining: 3:46:56\n", + "2023-04-07 02:27:38,945 - INFO - allennlp.training.trainer - Epoch 196/399\n", + "2023-04-07 02:27:38,945 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n", + "2023-04-07 02:27:38,946 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 02:27:38,956 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/95 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9574, UAS: 0.9680, LAS: 0.9432, UEM: 0.6083, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2071, partial_loss/deprel_loss: 0.2123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3913, loss: 0.4754, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||: 5%|5 | 5/95 [00:02<00:41, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9652, LAS: 0.9405, UEM: 0.5337, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5089, partial_loss/deprel_loss: 0.3847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.4913, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||: 11%|# | 10/95 [00:04<00:38, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9419, UAS: 0.9684, LAS: 0.9435, UEM: 0.6476, LEM: 0.4498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3862, partial_loss/deprel_loss: 0.3155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.4663, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||: 16%|#5 | 15/95 
[00:06<00:36, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9702, LAS: 0.9457, UEM: 0.7184, LEM: 0.5454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.2818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4979, loss: 0.4515, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||: 20%|## | 19/95 [00:08<00:36, 2.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9711, LAS: 0.9459, UEM: 0.7201, LEM: 0.5365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1590, partial_loss/deprel_loss: 0.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3893, loss: 0.4462, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||: 25%|##5 | 24/95 [00:10<00:32, 2.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9717, LAS: 0.9463, UEM: 0.7125, LEM: 0.5195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1199, partial_loss/deprel_loss: 0.1988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3629, loss: 0.4442, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||: 32%|###1 | 30/95 [00:13<00:28, 2.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9511, UAS: 0.9710, LAS: 0.9456, UEM: 0.6994, LEM: 0.5027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2418, partial_loss/deprel_loss: 0.2540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4315, loss: 0.4491, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||: 38%|###7 | 36/95 [00:15<00:25, 2.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9713, LAS: 0.9459, UEM: 0.7014, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2789, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4648, loss: 0.4461, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||: 43%|####3 | 41/95 [00:17<00:22, 2.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9491, UAS: 0.9716, LAS: 0.9463, UEM: 0.7029, LEM: 0.5023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.2487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4169, loss: 0.4436, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||: 48%|####8 | 46/95 [00:20<00:21, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9721, LAS: 0.9468, UEM: 0.7241, LEM: 0.5305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0812, partial_loss/deprel_loss: 0.1878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3463, loss: 0.4396, batch_reg_loss: 0.1799, reg_loss: 0.1799 ||: 54%|#####3 | 51/95 [00:22<00:19, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9718, LAS: 0.9463, UEM: 0.7154, LEM: 0.5183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1933, partial_loss/deprel_loss: 0.2721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4362, loss: 0.4425, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 59%|#####8 | 56/95 [00:24<00:16, 2.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9707, LAS: 0.9449, UEM: 0.7084, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8299, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6945, loss: 0.4511, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 64%|######4 | 61/95 [00:26<00:15, 2.26it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9708, LAS: 0.9450, UEM: 0.7059, LEM: 0.5047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1677, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.4509, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 69%|######9 | 66/95 [00:28<00:12, 2.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9704, LAS: 0.9446, UEM: 0.7017, LEM: 0.5009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1216, partial_loss/deprel_loss: 0.2030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3665, loss: 0.4535, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 75%|#######4 | 71/95 [00:31<00:10, 2.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9707, LAS: 0.9448, UEM: 0.7072, LEM: 0.5067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5046, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.4516, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 80%|######## | 76/95 [00:33<00:08, 2.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9706, LAS: 0.9446, UEM: 0.7021, LEM: 0.5010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4056, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.4530, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 85%|########5 | 81/95 [00:35<00:06, 2.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9711, LAS: 0.9451, UEM: 0.7149, LEM: 0.5145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1468, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4155, loss: 0.4493, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||: 91%|######### | 86/95 [00:37<00:03, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9708, LAS: 0.9447, UEM: 0.7110, LEM: 0.5093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.2541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4238, loss: 0.4509, batch_reg_loss: 0.1797, reg_loss: 0.1799 ||: 96%|#########5| 91/95 [00:39<00:01, 2.24it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9712, LAS: 0.9451, UEM: 0.7205, LEM: 0.5204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0793, partial_loss/deprel_loss: 0.1742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3349, loss: 0.4479, batch_reg_loss: 0.1797, reg_loss: 0.1799 ||: 100%|##########| 95/95 [00:41<00:00, 2.27it/s]\n", + "2023-04-07 02:28:24,033 - INFO - combo.training.trainer - Ran out of patience. 
Stopping training.\n", + "2023-04-07 02:28:24,034 - INFO - allennlp.training.checkpointer - loading best weights\n", + "2023-04-07 02:28:25,595 - INFO - allennlp.common.util - Metrics: {\n", + " \"best_epoch\": 195,\n", + " \"peak_worker_0_memory_MB\": 6955.8984375,\n", + " \"peak_gpu_0_memory_MB\": 2426.04052734375,\n", + " \"training_duration\": \"3:37:58.447135\",\n", + " \"training_start_epoch\": 0,\n", + " \"training_epochs\": 195,\n", + " \"epoch\": 195,\n", + " \"training_UPOS_ACC\": 0.0,\n", + " \"training_XPOS_ACC\": 0.0,\n", + " \"training_SEMREL_ACC\": 0.0,\n", + " \"training_LEMMA_ACC\": 0.0,\n", + " \"training_FEATS_ACC\": 0.0,\n", + " \"training_EM\": 0.9572854042053223,\n", + " \"training_UAS\": 0.9701954834274984,\n", + " \"training_LAS\": 0.9448924505842707,\n", + " \"training_UEM\": 0.7148521082441788,\n", + " \"training_LEM\": 0.5208936438011328,\n", + " \"training_EUAS\": 0.0,\n", + " \"training_ELAS\": 0.0,\n", + " \"training_EUEM\": 0.0,\n", + " \"training_ELEM\": 0.0,\n", + " \"training_partial_loss/head_loss\": 0.08596646785736084,\n", + " \"training_partial_loss/deprel_loss\": 0.15788140892982483,\n", + " \"training_partial_loss/cycle_loss\": 0.0,\n", + " \"training_loss\": 0.4496598549579319,\n", + " \"training_reg_loss\": 0.18018160729031812,\n", + " \"training_worker_0_memory_MB\": 6955.8984375,\n", + " \"training_gpu_0_memory_MB\": 2426.04052734375,\n", + " \"training_patience\": 1,\n", + " \"validation_UPOS_ACC\": 0.0,\n", + " \"validation_XPOS_ACC\": 0.0,\n", + " \"validation_SEMREL_ACC\": 0.0,\n", + " \"validation_LEMMA_ACC\": 0.0,\n", + " \"validation_FEATS_ACC\": 0.0,\n", + " \"validation_EM\": 0.9029048681259155,\n", + " \"validation_UAS\": 0.9531431054461182,\n", + " \"validation_LAS\": 0.9027375434530707,\n", + " \"validation_UEM\": 0.690843621399177,\n", + " \"validation_LEM\": 0.4182098765432099,\n", + " \"validation_EUAS\": 0.0,\n", + " \"validation_ELAS\": 0.0,\n", + " \"validation_EUEM\": 0.0,\n", + " \"validation_ELEM\": 
0.0,\n", + " \"validation_partial_loss/head_loss\": 0.5501478910446167,\n", + " \"validation_partial_loss/deprel_loss\": 6.855911731719971,\n", + " \"validation_partial_loss/cycle_loss\": 0.0,\n", + " \"validation_loss\": 6.80415695363825,\n", + " \"validation_reg_loss\": 0.0,\n", + " \"best_validation_UPOS_ACC\": 0.0,\n", + " \"best_validation_XPOS_ACC\": 0.0,\n", + " \"best_validation_SEMREL_ACC\": 0.0,\n", + " \"best_validation_LEMMA_ACC\": 0.0,\n", + " \"best_validation_FEATS_ACC\": 0.0,\n", + " \"best_validation_EM\": 0.9029048681259155,\n", + " \"best_validation_UAS\": 0.9531431054461182,\n", + " \"best_validation_LAS\": 0.9027375434530707,\n", + " \"best_validation_UEM\": 0.690843621399177,\n", + " \"best_validation_LEM\": 0.4182098765432099,\n", + " \"best_validation_EUAS\": 0.0,\n", + " \"best_validation_ELAS\": 0.0,\n", + " \"best_validation_EUEM\": 0.0,\n", + " \"best_validation_ELEM\": 0.0,\n", + " \"best_validation_partial_loss/head_loss\": 0.5501478910446167,\n", + " \"best_validation_partial_loss/deprel_loss\": 6.855911731719971,\n", + " \"best_validation_partial_loss/cycle_loss\": 0.0,\n", + " \"best_validation_loss\": 6.80415695363825,\n", + " \"best_validation_reg_loss\": 0.0\n", + "}\n", + "2023-04-07 02:28:25,596 - INFO - allennlp.models.archival - archiving weights and vocabulary to ./allennlp867qpopk/model.tar.gz\n", + "2023-04-07 02:40:44,065 - INFO - combo.main - Training model stored in: ./allennlp867qpopk\n" + ] + } + ], + "source": [ + "! {COMBO} --mode train \\\n", + " --training_data_path connlu/pdbc-cont-train.conllu \\\n", + " --validation_data_path connlu/pdbc-cont-validation.conllu \\\n", + " --cuda_device 0 \\\n", + " --pretrained_transformer_name allegro/herbert-large-cased \\\n", + " --targets head,deprel \\\n", + " --serialization_dir ." + ] + }, + { + "cell_type": "markdown", + "id": "74363e00", + "metadata": {}, + "source": [ + "Change `allennlp...` to the directory produced by COMBO." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "ae258726", + "metadata": {}, + "outputs": [], + "source": [ + "! rm -r model-pdbc-cont/\n", + "! mv allennlp867qpopk/ model-pdbc-cont/" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "combo_python39", + "language": "python", + "name": "combo_python39" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/COMBO/TrainModel.ipynb a/COMBO/TrainModel.ipynb new file mode 100644 index 0000000..f327a58 --- /dev/null +++ a/COMBO/TrainModel.ipynb @@ -0,0 +1,11222 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "aabfb24b", + "metadata": {}, + "outputs": [], + "source": [ + "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "54a97ebd", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "I0406 22:49:19.084177 139884283720768 params.py:248] include_in_archive = None\n", + "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - random_seed = 8787\n", + "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - numpy_seed = 8787\n", + "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - pytorch_seed = 8787\n", + "2023-04-06 22:49:19,086 - INFO - allennlp.common.checks - Pytorch version: 1.13.1\n", + "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - type = default\n", + "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - dataset_reader.type = conllu\n", + "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.lazy = False\n", + "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.cache_directory = None\n", + 
"2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.max_instances = None\n", + "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_distributed_sharding = False\n", + "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_multi_process_sharding = False\n", + "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.type = characters_const_padding\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.namespace = token_characters\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.start_tokens = None\n", + "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.end_tokens = None\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.min_padding_length = 32\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.token_min_padding_length = 0\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.type = feats_indexer\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.namespace = feats\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - 
dataset_reader.token_indexers.feats.feature_name = feats_\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.token_min_padding_length = 0\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.type = characters_const_padding\n", + "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.namespace = token_characters\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.start_tokens = None\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.end_tokens = None\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.min_padding_length = 32\n", + "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n", + "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n", + "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.token_min_padding_length = 0\n", + "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n", + "2023-04-06 22:49:19,092 - INFO - 
allennlp.common.params - dataset_reader.token_indexers.token.namespace = tags\n", + "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.max_length = None\n", + "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n", + "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.type = single_id\n", + "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.namespace = upostag\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.lowercase_tokens = False\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.start_tokens = None\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.end_tokens = None\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.feature_name = pos_\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.type = single_id\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.namespace = xpostag\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.start_tokens = None\n", + "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.end_tokens = None\n", + 
"2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.feature_name = tag_\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.type = characters_const_padding\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.namespace = lemma_characters\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n", + "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.start_tokens = None\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.end_tokens = None\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.min_padding_length = 32\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.features = ['token', 'char']\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.targets = ['head', 'deprel']\n", + "2023-04-06 
22:49:21,860 - INFO - allennlp.common.params - dataset_reader.use_sem = False\n", + "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - train_data_path = connlu/pdbc-train.conllu\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - datasets_for_vocab_creation = ['train']\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_dataset_reader = None\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_path = connlu/pdbc-validation.conllu\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_loader = None\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - test_data_path = None\n", + "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - evaluate_on_test = False\n", + "2023-04-06 22:49:21,862 - INFO - allennlp.common.params - batch_weight_key = \n", + "2023-04-06 22:49:21,862 - INFO - allennlp.training.util - Reading training data from connlu/pdbc-train.conllu\n", + "reading instances: 0it [00:00, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "reading instances: 3853it [00:02, 1926.46it/s]\n", + "reading instances: 8024it [00:04, 1907.69it/s]\n", + "reading instances: 11424it [00:06, 1840.15it/s]\n", + "reading instances: 14555it [00:08, 1654.52it/s]\n", + "reading instances: 17659it [00:09, 1772.69it/s]\n", + "2023-04-06 22:49:31,824 - INFO - allennlp.training.util - Reading validation data from connlu/pdbc-validation.conllu\n", + "reading instances: 0it [00:00, ?it/s]\n", + "reading instances: 1851it [00:02, 897.46it/s]\n", + "reading instances: 2211it [00:02, 933.13it/s]\n", + "2023-04-06 22:49:34,194 - INFO - allennlp.commands.train - From dataset instances, train will be considered for vocabulary creation.\n", + "2023-04-06 22:49:34,194 - INFO - allennlp.common.params - vocabulary.type = from_instances_extended\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_count = None\n", + 
"2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.max_vocab_size = None\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.non_padded_namespaces = ['head_labels']\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.pretrained_files = None\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.only_include_pretrained_words = True\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_pretrained_embeddings = None\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.padding_token = __PAD__\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.oov_token = _\n", + "2023-04-06 22:49:34,195 - INFO - allennlp.data.vocabulary - Fitting token dictionary from dataset.\n", + "building vocab: 0it [00:00, ?it/s]\n", + "building vocab: 16773it [00:02, 8386.16it/s]\n", + "building vocab: 17659it [00:02, 8423.42it/s]\n", + "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.type = semantic_multitask\n", + "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.text_field_embedder.type = basic\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.embedding_dim = 64\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - 
model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n", + "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n", + "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n", + "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n", + "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n", + "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = linear\n", + "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n", + "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n", + "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dim = 100\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f388b745280>\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.freeze_transformer = True\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.last_layer_only = 
True\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n", + "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n", + "2023-04-06 22:49:44,104 - INFO - allennlp.common.params - model.seq_encoder.type = combo_encoder\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.input_size = 164\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.hidden_size = 512\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.num_layers = 2\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n", + "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.use_highway = False\n", + "2023-04-06 22:49:44,804 - INFO - allennlp.common.params - model.seq_encoder.layer_dropout_probability = 0.33\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.use_sample_weight = True\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.lemmatizer = None\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.upos_tagger = None\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.xpos_tagger = None\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.semantic_relation = None\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.morphological_feat = None\n", + "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.dependency_relation.type = combo_dependency_parsing_from_vocab\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - 
model.dependency_relation.vocab_namespace = deprel_labels\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n", + "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n", + "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n", + "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.cycle_loss_n = 0\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.out_features = 128\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.activation = tanh\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - type = 
tanh\n", + "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n", + "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.in_features = 1024\n", + "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.out_features = 128\n", + "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.activation = tanh\n", + "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - type = tanh\n", + "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n", + "2023-04-06 22:49:44,820 - INFO - allennlp.common.params - model.enhanced_dependency_relation = None\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.type = l2\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.alpha = 1e-06\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.type = l2\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.alpha = 1e-06\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.type = l2\n", + "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.alpha = 1e-06\n", + "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.type = l2\n", + "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.alpha = 1e-05\n", + "2023-04-06 22:49:44,822 - INFO - filelock - Lock 139878665944848 acquired on ./allennlpru3hb8qq/vocabulary/.lock\n", + "2023-04-06 22:49:44,823 - INFO - filelock - Lock 139878665944848 released on ./allennlpru3hb8qq/vocabulary/.lock\n", + "2023-04-06 
22:49:44,823 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batch_size = 1\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.shuffle = False\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.sampler = None\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.num_workers = 0\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.pin_memory = False\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.drop_last = False\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.timeout = 0\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n", + "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n", + "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n", + "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n", + "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n", + "/home/kkrasnowska/anaconda3/envs/combo_p39/lib/python3.8/site-packages/combo/data/samplers/samplers.py:51: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. 
If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n", + " self.batch_dataset = np.array(self.batch_dataset)[indices].tolist()\n", + "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n", + "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.batch_size = 1\n", + "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.shuffle = False\n", + "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.sampler = None\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.num_workers = 0\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.pin_memory = False\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.drop_last = False\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.timeout = 0\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n", + "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n", + "2023-04-06 22:49:44,849 - INFO - allennlp.common.params - trainer.type = gradient_descent_validate_n\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.patience = 1\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.validation_metric = +EM\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_epochs = 400\n", + "2023-04-06 22:49:44,850 - INFO - 
allennlp.common.params - trainer.cuda_device = 0\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_norm = None\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_clipping = 5\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.distributed = None\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.world_size = 1\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_gradient_accumulation_steps = 1\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.use_amp = False\n", + "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.no_grad = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.momentum_scheduler = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.tensorboard_writer = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.moving_average = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.batch_callbacks = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.epoch_callbacks.0.type = transfer_patience\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.end_callbacks = None\n", + "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.trainer_callbacks = None\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.type = adam\r\n", + "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.parameter_groups = None\r\n", + "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.lr = 0.002\r\n", + "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.betas = [0.9, 0.9]\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.eps = 1e-08\r\n", + "2023-04-06 22:49:47,278 - 
INFO - allennlp.common.params - trainer.optimizer.weight_decay = 0.0\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.amsgrad = False\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.training.optimizers - Number of trainable parameters: 11053872\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - The following parameters are Frozen (without gradient):\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.word_embeddings.weight\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.position_embeddings.weight\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.token_type_embeddings.weight\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.bias\r\n", + "2023-04-06 22:49:47,279 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.bias\r\n", + 
"2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,282 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.bias\r\n", + 
"2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.bias\r\n", + 
"2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.bias\r\n", + 
"2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,289 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,291 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,293 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.weight\r\n", + "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.weight\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.bias\r\n", + "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,295 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.bias\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.bias\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,297 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,299 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.weight\r\n", 
+ "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - 
text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.bias\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.weight\r\n", + "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.bias\r\n", + "2023-04-06 22:49:47,301 - 
INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.weight\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.bias\r\n", + "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - The following parameters are Tunable (with gradient):\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - _head_sentinel\r\n", + "2023-04-06 22:49:47,302 - INFO - 
allennlp.common.util - text_field_embedder.token_embedder_char.char_embed.weight\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.weight\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.bias\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.weight\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.bias\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.weight\r\n", + "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.bias\r\n", + "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.weight\r\n", + "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.bias\r\n", + "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - 
seq_encoder._module.backward_layer_0.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.input_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.weight\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.bias\r\n", + "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.weight\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.bias\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.weight\r\n", + "2023-04-06 22:49:47,305 - INFO - 
allennlp.common.util - dependency_relation.relation_prediction_layer.bias\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.type = combo_scheduler\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.patience = 6\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.decreases = 2\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.threshold = 0.001\r\n", + "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.checkpointer.type = finishing_only_checkpointer\r\n", + "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.keep_serialized_model_every_num_seconds = None\r\n", + "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.num_serialized_models_to_keep = 2\r\n", + "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.model_save_interval = None\r\n", + "2023-04-06 22:49:47,308 - INFO - combo.training.trainer - Beginning training.\r\n", + "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Epoch 0/399\r\n", + "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.3G\r\n", + "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - GPU 0 memory usage: 1.4G\r\n", + "2023-04-06 22:49:47,315 - INFO - allennlp.training.trainer - Training\r\n", + " 0%| | 0/111 [00:00<?, ?it/s]\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0492, LAS: 0.0000, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7155, partial_loss/deprel_loss: 12.9573, partial_loss/cycle_loss: 0.0000, batch_loss: 12.4107, loss: 12.4107, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||: 1%| | 1/111 
[00:03<07:00, 3.82s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0559, LAS: 0.0045, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.7004, partial_loss/deprel_loss: 16.3879, partial_loss/cycle_loss: 0.0000, batch_loss: 17.1516, loss: 25.2089, batch_reg_loss: 0.1012, reg_loss: 0.1015 ||: 4%|3 | 4/111 [00:06<05:11, 2.91s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0120, UAS: 0.0714, LAS: 0.0044, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 22.1129, partial_loss/deprel_loss: 9.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 11.7916, loss: 24.6851, batch_reg_loss: 0.1006, reg_loss: 0.1012 ||: 6%|6 | 7/111 [00:08<03:56, 2.27s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0099, UAS: 0.0608, LAS: 0.0046, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.5869, partial_loss/deprel_loss: 9.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7085, loss: 21.3806, batch_reg_loss: 0.1000, reg_loss: 0.1009 ||: 9%|9 | 10/111 [00:10<03:01, 1.80s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0315, UAS: 0.0725, LAS: 0.0092, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 18.3275, partial_loss/deprel_loss: 7.1568, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4905, loss: 18.5717, batch_reg_loss: 0.0995, reg_loss: 0.1006 ||: 12%|#1 | 13/111 [00:12<02:26, 1.49s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0633, LAS: 0.0083, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 25.8989, partial_loss/deprel_loss: 11.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 14.6935, loss: 17.9697, batch_reg_loss: 0.0991, reg_loss: 0.1003 ||: 14%|#4 | 16/111 [00:15<01:59, 1.26s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0064, UAS: 0.0604, LAS: 0.0079, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 16.1143, partial_loss/deprel_loss: 10.8376, partial_loss/cycle_loss: 0.0000, batch_loss: 11.9915, loss: 16.8737, batch_reg_loss: 0.0986, reg_loss: 0.1001 ||: 17%|#7 | 19/111 [00:17<01:39, 1.08s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0079, UAS: 0.0579, LAS: 0.0081, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.2368, partial_loss/deprel_loss: 10.3155, partial_loss/cycle_loss: 0.0000, batch_loss: 11.3978, loss: 16.0851, batch_reg_loss: 0.0981, reg_loss: 0.0998 ||: 20%|#9 | 22/111 [00:19<01:25, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0259, UAS: 0.0602, LAS: 0.0091, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 13.9253, partial_loss/deprel_loss: 7.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 8.8288, loss: 15.3859, batch_reg_loss: 0.0976, reg_loss: 0.0996 ||: 23%|##2 | 25/111 [00:21<01:17, 1.11it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0267, UAS: 0.0629, LAS: 0.0101, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 23.9539, partial_loss/deprel_loss: 6.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 10.0631, loss: 14.9031, batch_reg_loss: 0.0971, reg_loss: 0.0994 ||: 25%|##5 | 28/111 [00:23<01:10, 
1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0139, UAS: 0.0629, LAS: 0.0103, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.2664, partial_loss/deprel_loss: 8.1915, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5031, loss: 14.5860, batch_reg_loss: 0.0966, reg_loss: 0.0991 ||: 28%|##7 | 31/111 [00:25<01:04, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0056, UAS: 0.0635, LAS: 0.0105, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.2399, partial_loss/deprel_loss: 9.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7789, loss: 14.1692, batch_reg_loss: 0.0961, reg_loss: 0.0989 ||: 31%|### | 34/111 [00:27<01:00, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0148, UAS: 0.0660, LAS: 0.0107, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0003, partial_loss/deprel_loss: 6.0032, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4982, loss: 13.6788, batch_reg_loss: 0.0956, reg_loss: 0.0986 ||: 33%|###3 | 37/111 [00:30<00:58, 1.26it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0159, UAS: 0.0717, LAS: 0.0140, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.5919, partial_loss/deprel_loss: 8.8836, partial_loss/cycle_loss: 0.0000, batch_loss: 9.3203, loss: 13.2278, batch_reg_loss: 0.0950, reg_loss: 0.0983 ||: 36%|###6 | 40/111 [00:32<00:58, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0160, UAS: 0.0744, LAS: 0.0148, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 10.1016, partial_loss/deprel_loss: 9.2769, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5363, loss: 12.8973, batch_reg_loss: 0.0945, reg_loss: 0.0981 ||: 39%|###8 | 43/111 [00:34<00:52, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0467, UAS: 0.0768, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8362, partial_loss/deprel_loss: 6.5938, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5361, loss: 12.5863, batch_reg_loss: 0.0939, reg_loss: 0.0978 ||: 41%|####1 | 46/111 [00:37<00:49, 1.31it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0130, UAS: 0.0790, LAS: 0.0162, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.9970, partial_loss/deprel_loss: 11.0561, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5376, loss: 12.3941, batch_reg_loss: 0.0933, reg_loss: 0.0976 ||: 44%|####4 | 49/111 [00:39<00:46, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0044, UAS: 0.0785, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.6006, partial_loss/deprel_loss: 11.6897, partial_loss/cycle_loss: 0.0000, batch_loss: 12.3646, loss: 12.3354, batch_reg_loss: 0.0927, reg_loss: 0.0973 ||: 47%|####6 | 52/111 [00:41<00:43, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0115, UAS: 0.0791, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.7207, partial_loss/deprel_loss: 11.0801, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5003, loss: 12.2236, batch_reg_loss: 0.0921, reg_loss: 0.0970 ||: 50%|####9 | 55/111 
[00:43<00:42, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0243, UAS: 0.0817, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.6552, partial_loss/deprel_loss: 7.4151, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3545, loss: 12.0074, batch_reg_loss: 0.0915, reg_loss: 0.0967 ||: 52%|#####2 | 58/111 [00:45<00:38, 1.36it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0191, UAS: 0.0860, LAS: 0.0174, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.0116, partial_loss/deprel_loss: 10.2631, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5036, loss: 11.7766, batch_reg_loss: 0.0908, reg_loss: 0.0965 ||: 55%|#####4 | 61/111 [00:48<00:38, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0343, UAS: 0.0937, LAS: 0.0194, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9906, partial_loss/deprel_loss: 8.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4916, loss: 11.4687, batch_reg_loss: 0.0900, reg_loss: 0.0961 ||: 59%|#####8 | 65/111 [00:50<00:33, 1.38it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0919, UAS: 0.0972, LAS: 0.0205, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0429, partial_loss/deprel_loss: 5.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3323, loss: 11.3481, batch_reg_loss: 0.0893, reg_loss: 0.0958 ||: 61%|######1 | 68/111 [00:53<00:33, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0574, UAS: 
0.1052, LAS: 0.0221, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5849, partial_loss/deprel_loss: 6.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7516, loss: 11.1225, batch_reg_loss: 0.0885, reg_loss: 0.0954 ||: 65%|######4 | 72/111 [00:56<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0301, UAS: 0.1099, LAS: 0.0231, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.2882, partial_loss/deprel_loss: 9.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4663, loss: 10.9824, batch_reg_loss: 0.0878, reg_loss: 0.0951 ||: 68%|######7 | 75/111 [01:00<00:33, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0518, UAS: 0.1162, LAS: 0.0250, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.7446, partial_loss/deprel_loss: 8.7894, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6676, loss: 10.8571, batch_reg_loss: 0.0872, reg_loss: 0.0948 ||: 70%|####### | 78/111 [01:02<00:29, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0834, UAS: 0.1219, LAS: 0.0265, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8250, partial_loss/deprel_loss: 7.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 7.1244, loss: 10.7374, batch_reg_loss: 0.0866, reg_loss: 0.0945 ||: 73%|#######2 | 81/111 [01:04<00:24, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0427, UAS: 0.1239, LAS: 0.0269, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.8399, partial_loss/deprel_loss: 10.0552, partial_loss/cycle_loss: 0.0000, batch_loss: 
10.2981, loss: 10.7271, batch_reg_loss: 0.0860, reg_loss: 0.0942 ||: 76%|#######5 | 84/111 [01:07<00:22, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0643, UAS: 0.1288, LAS: 0.0287, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8981, partial_loss/deprel_loss: 9.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5488, loss: 10.6448, batch_reg_loss: 0.0854, reg_loss: 0.0939 ||: 78%|#######8 | 87/111 [01:09<00:19, 1.24it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0661, UAS: 0.1356, LAS: 0.0319, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.0897, partial_loss/deprel_loss: 9.0732, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1614, loss: 10.5082, batch_reg_loss: 0.0849, reg_loss: 0.0936 ||: 81%|########1 | 90/111 [01:12<00:17, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0714, UAS: 0.1426, LAS: 0.0350, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.3305, partial_loss/deprel_loss: 8.5479, partial_loss/cycle_loss: 0.0000, batch_loss: 8.5886, loss: 10.3707, batch_reg_loss: 0.0842, reg_loss: 0.0932 ||: 85%|########4 | 94/111 [01:14<00:12, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0987, UAS: 0.1504, LAS: 0.0398, UEM: 0.0005, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8474, partial_loss/deprel_loss: 6.8979, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7715, loss: 10.2165, batch_reg_loss: 0.0837, reg_loss: 0.0929 ||: 87%|########7 | 97/111 [01:17<00:10, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.0733, UAS: 0.1541, LAS: 0.0412, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.9606, partial_loss/deprel_loss: 9.1819, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4208, loss: 10.1551, batch_reg_loss: 0.0831, reg_loss: 0.0927 ||: 90%|######### | 100/111 [01:19<00:08, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0887, UAS: 0.1585, LAS: 0.0433, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.6073, partial_loss/deprel_loss: 8.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6506, loss: 10.0863, batch_reg_loss: 0.0826, reg_loss: 0.0924 ||: 93%|#########2| 103/111 [01:21<00:06, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0763, UAS: 0.1650, LAS: 0.0476, UEM: 0.0015, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8387, partial_loss/deprel_loss: 8.8138, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1009, loss: 9.9700, batch_reg_loss: 0.0821, reg_loss: 0.0921 ||: 95%|#########5| 106/111 [01:24<00:04, 1.15it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1713, UAS: 0.1692, LAS: 0.0496, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5725, partial_loss/deprel_loss: 5.1460, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1130, loss: 9.8781, batch_reg_loss: 0.0817, reg_loss: 0.0918 ||: 98%|#########8| 109/111 [01:27<00:01, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1029, UAS: 0.1708, LAS: 0.0502, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.0519, partial_loss/deprel_loss: 7.4492, 
partial_loss/cycle_loss: 0.0000, batch_loss: 7.4511, loss: 9.8521, batch_reg_loss: 0.0813, reg_loss: 0.0916 ||: 100%|##########| 111/111 [01:28<00:00, 1.25it/s]\n", + "2023-04-06 22:51:15,927 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1167, UAS: 0.3116, LAS: 0.1456, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9999, partial_loss/deprel_loss: 15.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 13.8275, loss: 12.0213, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:12, 1.11s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2614, UAS: 0.3885, LAS: 0.1921, UEM: 0.0012, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.7361, partial_loss/deprel_loss: 8.9365, partial_loss/cycle_loss: 0.0000, batch_loss: 7.8964, loss: 10.3315, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 31%|### | 4/13 [00:04<00:10, 1.15s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1863, UAS: 0.3556, LAS: 0.1713, UEM: 0.0009, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5918, partial_loss/deprel_loss: 8.8550, partial_loss/cycle_loss: 0.0000, batch_loss: 8.2024, loss: 11.6787, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:07<00:08, 1.17s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1274, UAS: 0.3363, LAS: 0.1580, UEM: 0.0008, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5021, partial_loss/deprel_loss: 14.9977, partial_loss/cycle_loss: 0.0000, 
batch_loss: 13.4986, loss: 12.1599, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:09<00:05, 1.17s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0952, UAS: 0.3134, LAS: 0.1427, UEM: 0.0007, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.8305, partial_loss/deprel_loss: 17.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9268, loss: 13.2406, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:12<00:03, 1.20s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3824, UAS: 0.3342, LAS: 0.1583, UEM: 0.0460, LEM: 0.0089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 6.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5923, loss: 12.9753, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:14<00:01, 1.20s/it] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1377, UAS: 0.3324, LAS: 0.1568, UEM: 0.0427, LEM: 0.0083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.7160, partial_loss/deprel_loss: 11.9092, partial_loss/cycle_loss: 0.0000, batch_loss: 10.8705, loss: 12.8134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:15<00:00, 1.18s/it]\n", + "2023-04-06 22:51:31,252 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 
22:51:31,253 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 7.449 | 11.909\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 7.052 | 6.716\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - reg_loss | 0.092 | 0.000\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UEM | 0.001 | 0.043\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LAS | 0.050 | 0.157\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - loss | 9.852 | 12.813\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 1397.911 | N/A\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEM | 0.000 | 0.008\n", + "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - UAS | 0.171 | 0.332\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EM | 0.103 | 0.138\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 6486.516 | N/A\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Epoch duration: 0:01:43.946313\n", + "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Estimated training time 
remaining: 11:31:14\n", + "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Epoch 1/399\n", + "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:51:31,255 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:51:31,259 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5026, UAS: 0.5009, LAS: 0.2748, UEM: 0.3237, LEM: 0.0478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 2.2067, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0384, loss: 4.7510, batch_reg_loss: 0.0809, reg_loss: 0.0810 ||: 3%|2 | 3/111 [00:02<01:25, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2153, UAS: 0.4222, LAS: 0.2111, UEM: 0.2335, LEM: 0.0345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8553, partial_loss/deprel_loss: 5.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1419, loss: 5.9501, batch_reg_loss: 0.0804, reg_loss: 0.0808 ||: 5%|5 | 6/111 [00:04<01:21, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1178, UAS: 0.3878, LAS: 0.1808, UEM: 0.1884, LEM: 0.0278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1742, partial_loss/deprel_loss: 7.5720, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5724, loss: 6.4967, batch_reg_loss: 0.0800, reg_loss: 0.0806 ||: 8%|8 | 9/111 [00:06<01:17, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1538, UAS: 0.3796, LAS: 0.1788, UEM: 0.1554, LEM: 0.0230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.8665, partial_loss/deprel_loss: 7.3143, 
partial_loss/cycle_loss: 0.0000, batch_loss: 7.3044, loss: 6.6142, batch_reg_loss: 0.0796, reg_loss: 0.0804 ||: 11%|# | 12/111 [00:08<01:14, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3034, UAS: 0.3993, LAS: 0.1915, UEM: 0.1191, LEM: 0.0176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8777, partial_loss/deprel_loss: 4.3489, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1338, loss: 6.2776, batch_reg_loss: 0.0791, reg_loss: 0.0801 ||: 14%|#3 | 15/111 [00:11<01:10, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0891, UAS: 0.4053, LAS: 0.1952, UEM: 0.0993, LEM: 0.0147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.4397, partial_loss/deprel_loss: 9.1175, partial_loss/cycle_loss: 0.0000, batch_loss: 9.6606, loss: 6.2553, batch_reg_loss: 0.0787, reg_loss: 0.0799 ||: 16%|#6 | 18/111 [00:13<01:07, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1735, UAS: 0.3983, LAS: 0.1911, UEM: 0.0899, LEM: 0.0133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8049, partial_loss/deprel_loss: 6.6946, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5950, loss: 6.3528, batch_reg_loss: 0.0783, reg_loss: 0.0797 ||: 19%|#8 | 21/111 [00:15<01:03, 1.41it/s] \n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2083, UAS: 0.3981, LAS: 0.1902, UEM: 0.0799, LEM: 0.0118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1757, partial_loss/deprel_loss: 6.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 6.0662, loss: 6.4057, batch_reg_loss: 0.0778, reg_loss: 0.0794 ||: 23%|##2 | 25/111 [00:17<00:58, 1.48it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2246, UAS: 0.4012, LAS: 0.1929, UEM: 0.0725, LEM: 0.0107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8645, partial_loss/deprel_loss: 6.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5763, loss: 6.4495, batch_reg_loss: 0.0772, reg_loss: 0.0792 ||: 26%|##6 | 29/111 [00:19<00:53, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2794, UAS: 0.4082, LAS: 0.1982, UEM: 0.0672, LEM: 0.0099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1211, partial_loss/deprel_loss: 5.4412, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2540, loss: 6.4181, batch_reg_loss: 0.0768, reg_loss: 0.0790 ||: 29%|##8 | 32/111 [00:22<00:52, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4732, UAS: 0.4244, LAS: 0.2122, UEM: 0.0709, LEM: 0.0090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3779, partial_loss/deprel_loss: 2.8672, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6458, loss: 6.2343, batch_reg_loss: 0.0764, reg_loss: 0.0787 ||: 32%|###1 | 35/111 [00:24<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3141, UAS: 0.4378, LAS: 0.2248, UEM: 0.0649, LEM: 0.0081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3674, partial_loss/deprel_loss: 5.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1125, loss: 6.0777, batch_reg_loss: 0.0761, reg_loss: 0.0785 ||: 34%|###4 | 38/111 [00:26<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2198, UAS: 0.4458, LAS: 0.2334, UEM: 0.0596, LEM: 0.0074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.4857, 
partial_loss/deprel_loss: 7.1532, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2953, loss: 6.0151, batch_reg_loss: 0.0756, reg_loss: 0.0783 ||: 38%|###7 | 42/111 [00:28<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1855, UAS: 0.4456, LAS: 0.2364, UEM: 0.0564, LEM: 0.0070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.3300, partial_loss/deprel_loss: 7.6093, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0285, loss: 6.0670, batch_reg_loss: 0.0751, reg_loss: 0.0780 ||: 41%|####1 | 46/111 [00:31<00:41, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3267, UAS: 0.4538, LAS: 0.2458, UEM: 0.0542, LEM: 0.0064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.7855, partial_loss/deprel_loss: 5.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3551, loss: 5.9627, batch_reg_loss: 0.0747, reg_loss: 0.0778 ||: 45%|####5 | 50/111 [00:33<00:40, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2382, UAS: 0.4571, LAS: 0.2516, UEM: 0.0580, LEM: 0.0061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0241, partial_loss/deprel_loss: 6.9911, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2719, loss: 5.9374, batch_reg_loss: 0.0743, reg_loss: 0.0775 ||: 49%|####8 | 54/111 [00:36<00:38, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3417, UAS: 0.4640, LAS: 0.2595, UEM: 0.0551, LEM: 0.0057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.8885, partial_loss/deprel_loss: 5.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4367, loss: 5.8601, batch_reg_loss: 0.0740, reg_loss: 0.0773 ||: 51%|#####1 | 57/111 [00:38<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5159, UAS: 0.4709, LAS: 0.2672, UEM: 0.0535, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9516, partial_loss/deprel_loss: 3.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8855, loss: 5.7894, batch_reg_loss: 0.0737, reg_loss: 0.0772 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3337, UAS: 0.4761, LAS: 0.2741, UEM: 0.0511, LEM: 0.0052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5468, partial_loss/deprel_loss: 5.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6022, loss: 5.7441, batch_reg_loss: 0.0733, reg_loss: 0.0769 ||: 58%|#####7 | 64/111 [00:43<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4904, UAS: 0.4849, LAS: 0.2834, UEM: 0.0531, LEM: 0.0049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4105, partial_loss/deprel_loss: 3.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 3.2892, loss: 5.6526, batch_reg_loss: 0.0730, reg_loss: 0.0768 ||: 60%|###### | 67/111 [00:45<00:29, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4030, UAS: 0.4920, LAS: 0.2912, UEM: 0.0521, LEM: 0.0047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4853, partial_loss/deprel_loss: 4.8174, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8237, loss: 5.5778, batch_reg_loss: 0.0727, reg_loss: 0.0766 ||: 63%|######3 | 70/111 [00:47<00:28, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5730, UAS: 0.4957, LAS: 0.2965, UEM: 0.0518, LEM: 0.0046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8525, 
partial_loss/deprel_loss: 2.9431, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7975, loss: 5.5408, batch_reg_loss: 0.0724, reg_loss: 0.0764 ||: 66%|######5 | 73/111 [00:50<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6026, UAS: 0.5030, LAS: 0.3044, UEM: 0.0582, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 2.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1400, loss: 5.4648, batch_reg_loss: 0.0722, reg_loss: 0.0763 ||: 68%|######8 | 76/111 [00:52<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5257, UAS: 0.5093, LAS: 0.3114, UEM: 0.0590, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3376, partial_loss/deprel_loss: 3.2408, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1320, loss: 5.3956, batch_reg_loss: 0.0719, reg_loss: 0.0761 ||: 71%|#######1 | 79/111 [00:54<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4749, UAS: 0.5194, LAS: 0.3224, UEM: 0.0594, LEM: 0.0054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3244, partial_loss/deprel_loss: 4.0444, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9720, loss: 5.2892, batch_reg_loss: 0.0716, reg_loss: 0.0759 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3801, UAS: 0.5250, LAS: 0.3287, UEM: 0.0793, LEM: 0.0098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3332, partial_loss/deprel_loss: 5.2213, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3150, loss: 5.2322, batch_reg_loss: 0.0713, reg_loss: 0.0757 ||: 
77%|#######7 | 86/111 [00:58<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6195, UAS: 0.5311, LAS: 0.3359, UEM: 0.0901, LEM: 0.0120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5655, partial_loss/deprel_loss: 2.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4416, loss: 5.1692, batch_reg_loss: 0.0711, reg_loss: 0.0756 ||: 80%|######## | 89/111 [01:01<00:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3892, UAS: 0.5363, LAS: 0.3422, UEM: 0.0929, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3758, partial_loss/deprel_loss: 4.9502, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1062, loss: 5.1101, batch_reg_loss: 0.0708, reg_loss: 0.0754 ||: 83%|########2 | 92/111 [01:03<00:14, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4308, UAS: 0.5397, LAS: 0.3464, UEM: 0.0947, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4937, partial_loss/deprel_loss: 4.5762, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6303, loss: 5.0772, batch_reg_loss: 0.0706, reg_loss: 0.0753 ||: 86%|########5 | 95/111 [01:05<00:12, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4948, UAS: 0.5455, LAS: 0.3534, UEM: 0.0926, LEM: 0.0121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4684, partial_loss/deprel_loss: 3.7837, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7909, loss: 5.0118, batch_reg_loss: 0.0703, reg_loss: 0.0751 ||: 89%|########9 | 99/111 [01:08<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5697, UAS: 0.5519, LAS: 0.3608, UEM: 0.0901, LEM: 0.0116, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5438, partial_loss/deprel_loss: 3.1081, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0652, loss: 4.9450, batch_reg_loss: 0.0700, reg_loss: 0.0749 ||: 93%|#########2| 103/111 [01:11<00:05, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4417, UAS: 0.5557, LAS: 0.3658, UEM: 0.0879, LEM: 0.0113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9554, partial_loss/deprel_loss: 4.7208, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8375, loss: 4.9064, batch_reg_loss: 0.0697, reg_loss: 0.0747 ||: 96%|#########6| 107/111 [01:13<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 
0.000 | N/A\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 4.522 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 4.509 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - reg_loss | 0.075 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UEM | 0.086 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LAS | 0.369 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - loss | 4.890 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEM | 0.011 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UAS | 0.558 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EM | 0.456 | N/A\n", + "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Epoch 
duration: 0:01:16.269599\n", + "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Estimated training time remaining: 9:57:43\n", + "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Epoch 2/399\n", + "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:52:47,525 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:52:47,531 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4964, UAS: 0.6204, LAS: 0.4727, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5829, partial_loss/deprel_loss: 3.9397, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9376, loss: 4.4478, batch_reg_loss: 0.0693, reg_loss: 0.0693 ||: 3%|2 | 3/111 [00:02<01:15, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6479, UAS: 0.6977, LAS: 0.5419, UEM: 0.1026, LEM: 0.0106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4297, partial_loss/deprel_loss: 2.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2782, loss: 3.5690, batch_reg_loss: 0.0691, reg_loss: 0.0692 ||: 5%|5 | 6/111 [00:04<01:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4715, UAS: 0.6718, LAS: 0.5218, UEM: 0.0755, LEM: 0.0079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3314, partial_loss/deprel_loss: 4.2643, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3466, loss: 3.8142, batch_reg_loss: 0.0688, reg_loss: 0.0691 ||: 9%|9 | 10/111 [00:06<01:08, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.6659, UAS: 0.6858, LAS: 0.5350, UEM: 0.0982, LEM: 0.0139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2351, partial_loss/deprel_loss: 2.0560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9605, loss: 3.6185, batch_reg_loss: 0.0687, reg_loss: 0.0690 ||: 12%|#1 | 13/111 [00:09<01:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4735, UAS: 0.6843, LAS: 0.5326, UEM: 0.0795, LEM: 0.0112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1403, partial_loss/deprel_loss: 4.2142, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2679, loss: 3.6370, batch_reg_loss: 0.0685, reg_loss: 0.0689 ||: 15%|#5 | 17/111 [00:11<01:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6194, UAS: 0.6898, LAS: 0.5366, UEM: 0.0818, LEM: 0.0096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6949, partial_loss/deprel_loss: 2.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4592, loss: 3.5757, batch_reg_loss: 0.0683, reg_loss: 0.0688 ||: 19%|#8 | 21/111 [00:14<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8213, UAS: 0.6979, LAS: 0.5455, UEM: 0.2170, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.8507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 3.5040, batch_reg_loss: 0.0681, reg_loss: 0.0687 ||: 23%|##2 | 25/111 [00:17<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5476, UAS: 0.7039, LAS: 0.5509, UEM: 0.1942, LEM: 0.0844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0957, partial_loss/deprel_loss: 3.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5103, 
loss: 3.4550, batch_reg_loss: 0.0679, reg_loss: 0.0686 ||: 26%|##6 | 29/111 [00:19<00:55, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4213, UAS: 0.7068, LAS: 0.5547, UEM: 0.2095, LEM: 0.0826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1965, partial_loss/deprel_loss: 4.9298, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2509, loss: 3.4173, batch_reg_loss: 0.0677, reg_loss: 0.0685 ||: 29%|##8 | 32/111 [00:21<00:54, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4924, UAS: 0.7115, LAS: 0.5588, UEM: 0.1968, LEM: 0.0746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.2653, partial_loss/deprel_loss: 4.2745, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3402, loss: 3.3855, batch_reg_loss: 0.0675, reg_loss: 0.0684 ||: 32%|###2 | 36/111 [00:24<00:49, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4861, UAS: 0.7136, LAS: 0.5609, UEM: 0.1834, LEM: 0.0689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9229, partial_loss/deprel_loss: 4.5551, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6960, loss: 3.3816, batch_reg_loss: 0.0673, reg_loss: 0.0683 ||: 36%|###6 | 40/111 [00:26<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5632, UAS: 0.7197, LAS: 0.5670, UEM: 0.2184, LEM: 0.0784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7730, partial_loss/deprel_loss: 3.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3032, loss: 3.3144, batch_reg_loss: 0.0672, reg_loss: 0.0682 ||: 40%|###9 | 44/111 [00:29<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6700, UAS: 0.7271, LAS: 
0.5743, UEM: 0.2131, LEM: 0.0736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5173, partial_loss/deprel_loss: 2.2309, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1552, loss: 3.2352, batch_reg_loss: 0.0670, reg_loss: 0.0681 ||: 43%|####3 | 48/111 [00:32<00:42, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6822, UAS: 0.7298, LAS: 0.5776, UEM: 0.2081, LEM: 0.0692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4613, partial_loss/deprel_loss: 2.0556, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0036, loss: 3.1978, batch_reg_loss: 0.0668, reg_loss: 0.0680 ||: 47%|####6 | 52/111 [00:34<00:38, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5462, UAS: 0.7286, LAS: 0.5768, UEM: 0.2001, LEM: 0.0662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8922, partial_loss/deprel_loss: 3.8440, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9202, loss: 3.2158, batch_reg_loss: 0.0666, reg_loss: 0.0679 ||: 50%|##### | 56/111 [00:37<00:34, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6350, UAS: 0.7299, LAS: 0.5784, UEM: 0.1921, LEM: 0.0628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9702, partial_loss/deprel_loss: 2.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5707, loss: 3.2028, batch_reg_loss: 0.0665, reg_loss: 0.0678 ||: 54%|#####4 | 60/111 [00:39<00:31, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5091, UAS: 0.7325, LAS: 0.5817, UEM: 0.2037, LEM: 0.0652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4303, partial_loss/deprel_loss: 4.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2589, loss: 3.1722, 
batch_reg_loss: 0.0663, reg_loss: 0.0677 ||: 58%|#####7 | 64/111 [00:42<00:29, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7077, UAS: 0.7373, LAS: 0.5864, UEM: 0.2098, LEM: 0.0632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8847, partial_loss/deprel_loss: 1.6877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5933, loss: 3.1156, batch_reg_loss: 0.0661, reg_loss: 0.0677 ||: 61%|######1 | 68/111 [00:45<00:28, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6647, UAS: 0.7394, LAS: 0.5886, UEM: 0.2110, LEM: 0.0610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6878, partial_loss/deprel_loss: 2.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2747, loss: 3.0945, batch_reg_loss: 0.0660, reg_loss: 0.0676 ||: 65%|######4 | 72/111 [00:47<00:26, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.7455, LAS: 0.5957, UEM: 0.2179, LEM: 0.0604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9192, partial_loss/deprel_loss: 1.6239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5488, loss: 3.0243, batch_reg_loss: 0.0658, reg_loss: 0.0675 ||: 68%|######8 | 76/111 [00:50<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6129, UAS: 0.7469, LAS: 0.5972, UEM: 0.2108, LEM: 0.0580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4237, partial_loss/deprel_loss: 2.8786, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8533, loss: 3.0067, batch_reg_loss: 0.0657, reg_loss: 0.0674 ||: 72%|#######2 | 80/111 [00:52<00:20, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6110, UAS: 0.7481, LAS: 
0.5991, UEM: 0.2070, LEM: 0.0563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7020, partial_loss/deprel_loss: 2.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9341, loss: 2.9940, batch_reg_loss: 0.0655, reg_loss: 0.0673 ||: 76%|#######5 | 84/111 [00:55<00:17, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6596, UAS: 0.7500, LAS: 0.6014, UEM: 0.2146, LEM: 0.0583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7501, partial_loss/deprel_loss: 2.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2817, loss: 2.9726, batch_reg_loss: 0.0654, reg_loss: 0.0672 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6643, UAS: 0.7513, LAS: 0.6027, UEM: 0.2091, LEM: 0.0562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8068, partial_loss/deprel_loss: 2.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3218, loss: 2.9569, batch_reg_loss: 0.0652, reg_loss: 0.0671 ||: 83%|########2 | 92/111 [01:00<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6382, UAS: 0.7496, LAS: 0.6019, UEM: 0.2044, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3354, partial_loss/deprel_loss: 2.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7691, loss: 2.9764, batch_reg_loss: 0.0651, reg_loss: 0.0670 ||: 86%|########6 | 96/111 [01:03<00:09, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6473, UAS: 0.7524, LAS: 0.6053, UEM: 0.2124, LEM: 0.0594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9798, 
partial_loss/deprel_loss: 2.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4257, loss: 2.9392, batch_reg_loss: 0.0650, reg_loss: 0.0670 ||: 90%|######### | 100/111 [01:06<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7644, UAS: 0.7557, LAS: 0.6091, UEM: 0.2193, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3145, loss: 2.9018, batch_reg_loss: 0.0649, reg_loss: 0.0669 ||: 93%|#########2| 103/111 [01:08<00:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7586, LAS: 0.6125, UEM: 0.2241, LEM: 0.0607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8481, partial_loss/deprel_loss: 1.5531, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4769, loss: 2.8675, batch_reg_loss: 0.0648, reg_loss: 0.0668 ||: 95%|#########5| 106/111 [01:10<00:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6552, UAS: 0.7581, LAS: 0.6123, UEM: 0.2194, LEM: 0.0593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0818, partial_loss/deprel_loss: 2.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4559, loss: 2.8710, batch_reg_loss: 0.0647, reg_loss: 0.0668 ||: 99%|#########9| 110/111 [01:13<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7592, LAS: 0.6135, UEM: 0.2213, LEM: 0.0596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 1.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4210, loss: 2.8579, batch_reg_loss: 0.0646, reg_loss: 0.0668 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + 
"2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.480 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.861 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - reg_loss | 0.067 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UEM | 0.221 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LAS | 0.614 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - loss | 2.858 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEM | 0.060 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UAS | 0.759 | N/A\n", + 
"2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EM | 0.747 | N/A\n", + "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Epoch duration: 0:01:13.964691\n", + "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Estimated training time remaining: 9:20:36\n", + "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Epoch 3/399\n", + "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:54:01,490 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:54:01,496 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5522, UAS: 0.7779, LAS: 0.6461, UEM: 0.4911, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8721, partial_loss/deprel_loss: 3.5902, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7111, loss: 2.6501, batch_reg_loss: 0.0646, reg_loss: 0.0646 ||: 3%|2 | 3/111 [00:02<01:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5244, UAS: 0.7464, LAS: 0.6105, UEM: 0.3157, LEM: 0.1195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4001, partial_loss/deprel_loss: 3.7685, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9592, loss: 2.9957, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||: 6%|6 | 7/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7839, UAS: 0.7827, LAS: 0.6504, UEM: 0.3397, LEM: 0.1092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6771, partial_loss/deprel_loss: 1.2152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1719, loss: 2.5749, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||: 9%|9 | 10/111 [00:07<01:15, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5962, UAS: 0.7864, LAS: 0.6557, UEM: 0.2923, LEM: 0.0888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4499, partial_loss/deprel_loss: 3.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3466, loss: 2.5323, batch_reg_loss: 0.0643, reg_loss: 0.0644 ||: 12%|#1 | 13/111 [00:09<01:15, 1.30it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7262, UAS: 0.7947, LAS: 0.6646, UEM: 0.2585, LEM: 0.0737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3265, partial_loss/deprel_loss: 2.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9340, loss: 2.4410, batch_reg_loss: 0.0642, reg_loss: 0.0644 ||: 14%|#4 | 16/111 [00:11<01:10, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.7977, LAS: 0.6674, UEM: 0.2444, LEM: 0.0644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9908, partial_loss/deprel_loss: 1.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4713, loss: 2.4127, batch_reg_loss: 0.0641, reg_loss: 0.0644 ||: 18%|#8 | 20/111 [00:14<01:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7616, UAS: 0.8064, LAS: 0.6763, UEM: 0.2720, LEM: 0.0723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6766, partial_loss/deprel_loss: 1.3444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 2.3152, batch_reg_loss: 0.0640, reg_loss: 0.0643 
||: 22%|##1 | 24/111 [00:17<01:01, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.8092, LAS: 0.6787, UEM: 0.2590, LEM: 0.0651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5602, loss: 2.2885, batch_reg_loss: 0.0639, reg_loss: 0.0643 ||: 25%|##5 | 28/111 [00:19<00:56, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6937, UAS: 0.8106, LAS: 0.6800, UEM: 0.2438, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7709, partial_loss/deprel_loss: 2.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2642, loss: 2.2836, batch_reg_loss: 0.0638, reg_loss: 0.0642 ||: 28%|##7 | 31/111 [00:21<00:54, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6296, UAS: 0.8098, LAS: 0.6796, UEM: 0.2471, LEM: 0.0589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8165, partial_loss/deprel_loss: 2.8907, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9396, loss: 2.2935, batch_reg_loss: 0.0637, reg_loss: 0.0642 ||: 31%|### | 34/111 [00:23<00:52, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7206, UAS: 0.8103, LAS: 0.6805, UEM: 0.2360, LEM: 0.0556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4751, partial_loss/deprel_loss: 1.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8562, loss: 2.2865, batch_reg_loss: 0.0637, reg_loss: 0.0641 ||: 33%|###3 | 37/111 [00:25<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7730, UAS: 0.8120, LAS: 0.6830, UEM: 0.2357, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 1.3218, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2718, loss: 2.2638, batch_reg_loss: 0.0636, reg_loss: 0.0641 ||: 37%|###6 | 41/111 [00:28<00:48, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7604, UAS: 0.8162, LAS: 0.6880, UEM: 0.2428, LEM: 0.0550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 1.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4763, loss: 2.2114, batch_reg_loss: 0.0635, reg_loss: 0.0640 ||: 40%|###9 | 44/111 [00:31<00:48, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6857, UAS: 0.8111, LAS: 0.6833, UEM: 0.2349, LEM: 0.0532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9399, partial_loss/deprel_loss: 2.2534, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2541, loss: 2.2633, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||: 42%|####2 | 47/111 [00:33<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5934, UAS: 0.8120, LAS: 0.6844, UEM: 0.2419, LEM: 0.0557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2585, partial_loss/deprel_loss: 3.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4829, loss: 2.2516, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||: 45%|####5 | 50/111 [00:35<00:43, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7835, UAS: 0.8132, LAS: 0.6859, UEM: 0.2388, LEM: 0.0539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 1.3395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2956, loss: 2.2403, batch_reg_loss: 0.0633, reg_loss: 0.0639 ||: 49%|####8 | 54/111 
[00:37<00:39, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6621, UAS: 0.8141, LAS: 0.6874, UEM: 0.2512, LEM: 0.0626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2108, partial_loss/deprel_loss: 2.3082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3519, loss: 2.2189, batch_reg_loss: 0.0632, reg_loss: 0.0639 ||: 51%|#####1 | 57/111 [00:40<00:38, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.8126, LAS: 0.6865, UEM: 0.2518, LEM: 0.0619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7939, partial_loss/deprel_loss: 1.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3063, loss: 2.2319, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||: 55%|#####4 | 61/111 [00:42<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6531, UAS: 0.8133, LAS: 0.6870, UEM: 0.2467, LEM: 0.0600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5764, partial_loss/deprel_loss: 2.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7397, loss: 2.2260, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||: 58%|#####7 | 64/111 [00:44<00:32, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8168, LAS: 0.6906, UEM: 0.2563, LEM: 0.0609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 1.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 2.1896, batch_reg_loss: 0.0630, reg_loss: 0.0638 ||: 60%|###### | 67/111 [00:46<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7593, UAS: 0.8180, LAS: 0.6922, UEM: 0.2522, LEM: 0.0592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 1.5328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4947, loss: 2.1787, batch_reg_loss: 0.0630, reg_loss: 0.0637 ||: 63%|######3 | 70/111 [00:49<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.8196, LAS: 0.6948, UEM: 0.2829, LEM: 0.0893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 2.1589, batch_reg_loss: 0.0629, reg_loss: 0.0637 ||: 67%|######6 | 74/111 [00:52<00:27, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6841, UAS: 0.8216, LAS: 0.6972, UEM: 0.2908, LEM: 0.0913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9630, partial_loss/deprel_loss: 2.3586, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3423, loss: 2.1351, batch_reg_loss: 0.0628, reg_loss: 0.0637 ||: 69%|######9 | 77/111 [00:54<00:25, 1.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8176, LAS: 0.6935, UEM: 0.2843, LEM: 0.0890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5630, partial_loss/deprel_loss: 1.9479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9337, loss: 2.1812, batch_reg_loss: 0.0628, reg_loss: 0.0636 ||: 73%|#######2 | 81/111 [00:57<00:21, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7388, UAS: 0.8182, LAS: 0.6943, UEM: 0.2795, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1689, partial_loss/deprel_loss: 1.7263, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6775, loss: 
2.1734, batch_reg_loss: 0.0627, reg_loss: 0.0636 ||: 77%|#######6 | 85/111 [00:59<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7027, UAS: 0.8202, LAS: 0.6969, UEM: 0.2926, LEM: 0.0965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7537, partial_loss/deprel_loss: 2.1230, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1117, loss: 2.1483, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||: 80%|######## | 89/111 [01:02<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7744, UAS: 0.8185, LAS: 0.6957, UEM: 0.2882, LEM: 0.0944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0477, partial_loss/deprel_loss: 1.4812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4571, loss: 2.1638, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||: 84%|########3 | 93/111 [01:04<00:11, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.8203, LAS: 0.6977, UEM: 0.2968, LEM: 0.0975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4458, partial_loss/deprel_loss: 0.9504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9120, loss: 2.1448, batch_reg_loss: 0.0625, reg_loss: 0.0635 ||: 87%|########7 | 97/111 [01:07<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6879, UAS: 0.8175, LAS: 0.6950, UEM: 0.2918, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0558, partial_loss/deprel_loss: 2.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3255, loss: 2.1791, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||: 91%|######### | 101/111 [01:10<00:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7525, 
UAS: 0.8183, LAS: 0.6962, UEM: 0.2889, LEM: 0.0938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1692, partial_loss/deprel_loss: 1.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6361, loss: 2.1703, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||: 95%|#########4| 105/111 [01:13<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6415, UAS: 0.8200, LAS: 0.6981, UEM: 0.2967, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9598, partial_loss/deprel_loss: 2.7343, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8417, loss: 2.1535, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||: 98%|#########8| 109/111 [01:15<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6768, UAS: 0.8197, LAS: 0.6979, UEM: 0.2936, LEM: 0.0948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2748, partial_loss/deprel_loss: 2.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4206, loss: 2.1574, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - 
combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 2.379 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 2.275 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - reg_loss | 0.063 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UEM | 0.294 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LAS | 0.698 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - loss | 2.157 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEM | 0.095 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UAS | 0.820 | N/A\n", + "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - EM | 0.677 | N/A\n", + "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Epoch duration: 0:01:16.740242\n", + "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Estimated training time remaining: 9:06:01\n", + "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Epoch 4/399\n", + "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:55:18,230 - INFO - 
allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:55:18,236 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6673, UAS: 0.7876, LAS: 0.6728, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6651, partial_loss/deprel_loss: 2.6082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6819, loss: 2.5358, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||: 3%|2 | 3/111 [00:02<01:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5590, UAS: 0.7847, LAS: 0.6734, UEM: 0.0866, LEM: 0.0162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1240, partial_loss/deprel_loss: 3.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9583, loss: 2.5349, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||: 5%|5 | 6/111 [00:04<01:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.8104, LAS: 0.7009, UEM: 0.1961, LEM: 0.0497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6716, partial_loss/deprel_loss: 1.1607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1251, loss: 2.2299, batch_reg_loss: 0.0622, reg_loss: 0.0623 ||: 8%|8 | 9/111 [00:06<01:13, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6524, UAS: 0.8224, LAS: 0.7121, UEM: 0.2315, LEM: 0.0565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7101, partial_loss/deprel_loss: 2.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6826, loss: 2.1006, batch_reg_loss: 0.0622, reg_loss: 0.0622 ||: 12%|#1 | 13/111 [00:09<01:08, 1.43it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.8348, LAS: 0.7248, UEM: 0.3040, LEM: 0.0847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0855, loss: 1.9659, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||: 14%|#4 | 16/111 [00:11<01:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.8448, LAS: 0.7351, UEM: 0.3447, LEM: 0.0959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1769, partial_loss/deprel_loss: 1.5892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5688, loss: 1.8513, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||: 17%|#7 | 19/111 [00:13<01:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6802, UAS: 0.8436, LAS: 0.7338, UEM: 0.3206, LEM: 0.0886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3447, partial_loss/deprel_loss: 2.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3715, loss: 1.8468, batch_reg_loss: 0.0620, reg_loss: 0.0622 ||: 21%|## | 23/111 [00:16<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6018, UAS: 0.8382, LAS: 0.7278, UEM: 0.2957, LEM: 0.0798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.6370, partial_loss/deprel_loss: 2.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1524, loss: 1.9081, batch_reg_loss: 0.0620, reg_loss: 0.0621 ||: 24%|##4 | 27/111 [00:18<00:56, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.8419, LAS: 0.7321, UEM: 0.3047, LEM: 0.0860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6244, partial_loss/deprel_loss: 1.0798, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0506, loss: 1.8696, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||: 28%|##7 | 31/111 [00:21<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6994, UAS: 0.8443, LAS: 0.7347, UEM: 0.3040, LEM: 0.0849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3267, partial_loss/deprel_loss: 2.3726, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4253, loss: 1.8526, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||: 31%|### | 34/111 [00:23<00:52, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8111, UAS: 0.8474, LAS: 0.7388, UEM: 0.3153, LEM: 0.0885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9856, loss: 1.8095, batch_reg_loss: 0.0618, reg_loss: 0.0621 ||: 33%|###3 | 37/111 [00:26<00:54, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7707, UAS: 0.8458, LAS: 0.7371, UEM: 0.3159, LEM: 0.0895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1063, partial_loss/deprel_loss: 1.5260, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5038, loss: 1.8230, batch_reg_loss: 0.0618, reg_loss: 0.0620 ||: 37%|###6 | 41/111 [00:28<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6812, UAS: 0.8369, LAS: 0.7281, UEM: 0.3046, LEM: 0.0863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4355, partial_loss/deprel_loss: 2.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5312, loss: 1.9258, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||: 41%|#### | 45/111 [00:31<00:44, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7159, UAS: 0.8362, LAS: 0.7273, UEM: 0.2977, LEM: 0.0830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6377, partial_loss/deprel_loss: 2.1209, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0860, loss: 1.9371, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||: 43%|####3 | 48/111 [00:33<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7413, UAS: 0.8332, LAS: 0.7243, UEM: 0.2893, LEM: 0.0804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3635, partial_loss/deprel_loss: 1.7896, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7661, loss: 1.9680, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||: 46%|####5 | 51/111 [00:35<00:43, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7546, UAS: 0.8368, LAS: 0.7289, UEM: 0.3044, LEM: 0.0903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4638, partial_loss/deprel_loss: 1.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6829, loss: 1.9241, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||: 50%|####9 | 55/111 [00:38<00:38, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.8378, LAS: 0.7302, UEM: 0.2995, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7480, partial_loss/deprel_loss: 1.2659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2240, loss: 1.9138, batch_reg_loss: 0.0617, reg_loss: 0.0619 ||: 53%|#####3 | 59/111 [00:40<00:35, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8413, LAS: 0.7346, UEM: 0.3580, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7434, 
partial_loss/deprel_loss: 2.0320, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0359, loss: 1.8734, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||: 56%|#####5 | 62/111 [00:43<00:36, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7846, UAS: 0.8430, LAS: 0.7366, UEM: 0.3472, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 1.4828, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4530, loss: 1.8528, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||: 59%|#####9 | 66/111 [00:46<00:32, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8108, UAS: 0.8447, LAS: 0.7383, UEM: 0.3415, LEM: 0.1300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7083, partial_loss/deprel_loss: 1.0955, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0797, loss: 1.8399, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||: 63%|######3 | 70/111 [00:49<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.8453, LAS: 0.7392, UEM: 0.3375, LEM: 0.1274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 1.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1661, loss: 1.8386, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||: 66%|######5 | 73/111 [00:51<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7005, UAS: 0.8452, LAS: 0.7393, UEM: 0.3279, LEM: 0.1228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2810, partial_loss/deprel_loss: 2.1734, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2565, loss: 1.8368, batch_reg_loss: 0.0615, reg_loss: 0.0619 ||: 69%|######9 | 77/111 [00:53<00:23, 1.47it/s]\n" + ] + }, + { + "name": 
"stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6741, UAS: 0.8452, LAS: 0.7395, UEM: 0.3431, LEM: 0.1362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5383, partial_loss/deprel_loss: 2.6162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6622, loss: 1.8377, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||: 72%|#######2 | 80/111 [00:55<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7905, UAS: 0.8448, LAS: 0.7389, UEM: 0.3355, LEM: 0.1324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8467, partial_loss/deprel_loss: 1.3524, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 1.8435, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||: 76%|#######5 | 84/111 [00:58<00:18, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7866, UAS: 0.8450, LAS: 0.7392, UEM: 0.3311, LEM: 0.1296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9914, partial_loss/deprel_loss: 1.4335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4066, loss: 1.8406, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||: 78%|#######8 | 87/111 [01:00<00:16, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.8472, LAS: 0.7416, UEM: 0.3370, LEM: 0.1305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7954, loss: 1.8162, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||: 82%|########1 | 91/111 [01:02<00:13, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6469, UAS: 0.8463, LAS: 0.7407, UEM: 0.3336, LEM: 0.1286, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0053, partial_loss/deprel_loss: 2.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5838, loss: 1.8231, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||: 85%|########4 | 94/111 [01:05<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7256, UAS: 0.8454, LAS: 0.7396, UEM: 0.3284, LEM: 0.1263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6650, partial_loss/deprel_loss: 1.9252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9346, loss: 1.8328, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||: 87%|########7 | 97/111 [01:07<00:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7599, UAS: 0.8465, LAS: 0.7407, UEM: 0.3289, LEM: 0.1240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2847, partial_loss/deprel_loss: 1.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7031, loss: 1.8239, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||: 91%|######### | 101/111 [01:09<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.8483, LAS: 0.7429, UEM: 0.3366, LEM: 0.1267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5180, partial_loss/deprel_loss: 0.8814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8701, loss: 1.8040, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||: 95%|#########4| 105/111 [01:11<00:03, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7331, UAS: 0.8486, LAS: 0.7433, UEM: 0.3357, LEM: 0.1260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9632, partial_loss/deprel_loss: 1.9598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0219, loss: 1.8012, batch_reg_loss: 0.0614, 
reg_loss: 0.0617 ||: 98%|#########8| 109/111 [01:14<00:01, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.8500, LAS: 0.7451, UEM: 0.3439, LEM: 0.1293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5623, partial_loss/deprel_loss: 0.9248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9137, loss: 1.7845, batch_reg_loss: 0.0614, reg_loss: 0.0617 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.925 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.562 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - reg_loss | 0.062 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UEM | 0.344 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LAS | 0.745 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - 
combo.training.tensorboard_writer - loss | 1.785 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEM | 0.129 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - UAS | 0.850 | N/A\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - EM | 0.835 | N/A\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Epoch duration: 0:01:15.570663\n", + "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:12\n", + "2023-04-06 22:56:33,800 - INFO - allennlp.training.trainer - Epoch 5/399\n", + "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:56:33,806 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7017, UAS: 0.8575, LAS: 0.7564, UEM: 0.2434, LEM: 0.0823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1851, partial_loss/deprel_loss: 2.1142, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1898, loss: 1.6516, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 4%|3 | 4/111 [00:02<00:55, 1.93it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 
0.8573, LAS: 0.7593, UEM: 0.1945, LEM: 0.0493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 1.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3831, loss: 1.6800, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 7%|7 | 8/111 [00:04<00:55, 1.84it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8045, UAS: 0.8581, LAS: 0.7600, UEM: 0.1996, LEM: 0.0437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7492, partial_loss/deprel_loss: 1.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1844, loss: 1.6630, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 10%|9 | 11/111 [00:06<01:00, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7124, UAS: 0.8519, LAS: 0.7533, UEM: 0.1704, LEM: 0.0371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3078, partial_loss/deprel_loss: 2.1321, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2286, loss: 1.7343, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 13%|#2 | 14/111 [00:08<01:02, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.8522, LAS: 0.7539, UEM: 0.1756, LEM: 0.0394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 1.1383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1219, loss: 1.7377, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 15%|#5 | 17/111 [00:11<01:03, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7448, UAS: 0.8579, LAS: 0.7603, UEM: 0.2127, LEM: 0.0579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5514, partial_loss/deprel_loss: 1.6989, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.7308, loss: 1.6711, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 18%|#8 | 20/111 [00:13<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8081, UAS: 0.8630, LAS: 0.7659, UEM: 0.2570, LEM: 0.0807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9484, partial_loss/deprel_loss: 1.1780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1934, loss: 1.6165, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 21%|## | 23/111 [00:15<01:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7710, UAS: 0.8636, LAS: 0.7669, UEM: 0.2827, LEM: 0.0951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3315, partial_loss/deprel_loss: 1.5198, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5435, loss: 1.6098, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 23%|##3 | 26/111 [00:17<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7620, UAS: 0.8608, LAS: 0.7644, UEM: 0.3072, LEM: 0.1148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3709, partial_loss/deprel_loss: 1.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5573, loss: 1.6290, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 27%|##7 | 30/111 [00:20<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.8687, LAS: 0.7732, UEM: 0.3575, LEM: 0.1333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5238, partial_loss/deprel_loss: 0.8705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 1.5422, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 31%|### | 34/111 [00:22<00:51, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.6280, UAS: 0.8659, LAS: 0.7697, UEM: 0.3664, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5054, partial_loss/deprel_loss: 2.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9489, loss: 1.5726, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 34%|###4 | 38/111 [00:25<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7226, UAS: 0.8644, LAS: 0.7677, UEM: 0.3535, LEM: 0.1338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9962, partial_loss/deprel_loss: 2.0087, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0676, loss: 1.5945, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 38%|###7 | 42/111 [00:27<00:45, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7397, UAS: 0.8681, LAS: 0.7717, UEM: 0.3782, LEM: 0.1455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6230, partial_loss/deprel_loss: 1.7756, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8064, loss: 1.5545, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 41%|####1 | 46/111 [00:30<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8698, LAS: 0.7736, UEM: 0.3770, LEM: 0.1440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9417, loss: 1.5345, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 45%|####5 | 50/111 [00:33<00:41, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7631, UAS: 0.8696, LAS: 0.7733, UEM: 0.3760, LEM: 0.1438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5292, partial_loss/deprel_loss: 1.6206, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.6637, loss: 1.5373, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 48%|####7 | 53/111 [00:35<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.8706, LAS: 0.7745, UEM: 0.3732, LEM: 0.1419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0361, partial_loss/deprel_loss: 1.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3686, loss: 1.5272, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 50%|##### | 56/111 [00:37<00:38, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.8725, LAS: 0.7769, UEM: 0.3885, LEM: 0.1536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 1.0568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0458, loss: 1.5054, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 53%|#####3 | 59/111 [00:39<00:36, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.8729, LAS: 0.7771, UEM: 0.3914, LEM: 0.1520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6869, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0979, loss: 1.5056, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 56%|#####5 | 62/111 [00:42<00:34, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7123, UAS: 0.8726, LAS: 0.7767, UEM: 0.3847, LEM: 0.1476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1384, partial_loss/deprel_loss: 1.9929, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0833, loss: 1.5100, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 59%|#####8 | 65/111 [00:44<00:32, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9076, UAS: 0.8741, LAS: 0.7786, UEM: 0.4104, LEM: 0.1780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1555, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 1.4902, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 61%|######1 | 68/111 [00:46<00:31, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6839, UAS: 0.8727, LAS: 0.7774, UEM: 0.4028, LEM: 0.1735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6867, partial_loss/deprel_loss: 2.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4223, loss: 1.4995, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 64%|######3 | 71/111 [00:48<00:28, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.8714, LAS: 0.7764, UEM: 0.3971, LEM: 0.1677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 1.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 1.5104, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 68%|######7 | 75/111 [00:51<00:24, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6175, UAS: 0.8696, LAS: 0.7746, UEM: 0.3921, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8233, partial_loss/deprel_loss: 2.8003, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0663, loss: 1.5301, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 71%|#######1 | 79/111 [00:53<00:20, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.8661, LAS: 0.7709, UEM: 0.3842, LEM: 0.1610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.5925, partial_loss/deprel_loss: 1.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8223, loss: 1.5739, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 75%|#######4 | 83/111 [00:55<00:18, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.8666, LAS: 0.7714, UEM: 0.3769, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5992, partial_loss/deprel_loss: 1.6861, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7301, loss: 1.5698, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||: 78%|#######8 | 87/111 [00:58<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6880, UAS: 0.8660, LAS: 0.7708, UEM: 0.3766, LEM: 0.1560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6133, partial_loss/deprel_loss: 2.1378, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2944, loss: 1.5744, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||: 81%|########1 | 90/111 [01:01<00:15, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7145, UAS: 0.8654, LAS: 0.7703, UEM: 0.3729, LEM: 0.1542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3646, partial_loss/deprel_loss: 2.0728, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1926, loss: 1.5798, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||: 84%|########3 | 93/111 [01:03<00:13, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7754, UAS: 0.8652, LAS: 0.7702, UEM: 0.3709, LEM: 0.1526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2314, partial_loss/deprel_loss: 1.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5543, loss: 1.5834, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||: 86%|########6 | 96/111 [01:05<00:10, 1.36it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7925, UAS: 0.8642, LAS: 0.7695, UEM: 0.3719, LEM: 0.1529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1520, partial_loss/deprel_loss: 1.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3735, loss: 1.5922, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||: 89%|########9 | 99/111 [01:08<00:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6972, UAS: 0.8644, LAS: 0.7697, UEM: 0.3691, LEM: 0.1504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3335, partial_loss/deprel_loss: 2.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3058, loss: 1.5920, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||: 93%|#########2| 103/111 [01:10<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.8655, LAS: 0.7711, UEM: 0.3800, LEM: 0.1593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.5589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 1.5770, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||: 95%|#########5| 106/111 [01:12<00:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7927, UAS: 0.8653, LAS: 0.7706, UEM: 0.3763, LEM: 0.1567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9309, partial_loss/deprel_loss: 1.2968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||: 98%|#########8| 109/111 [01:14<00:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8018, UAS: 0.8655, LAS: 0.7708, UEM: 0.3731, LEM: 0.1547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8911, partial_loss/deprel_loss: 1.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2913, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-06 22:57:49,583 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.9041, LAS: 0.8223, UEM: 0.3590, LEM: 0.0897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9126, partial_loss/deprel_loss: 32.0601, partial_loss/cycle_loss: 0.0000, batch_loss: 25.8306, loss: 27.0349, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9214, LAS: 0.8453, UEM: 0.5769, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 16.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 13.2159, loss: 21.8993, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7466, UAS: 0.9121, LAS: 0.8362, UEM: 0.5609, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1975, partial_loss/deprel_loss: 54.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 44.0925, loss: 25.0782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9151, LAS: 0.8387, UEM: 0.5397, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 22.6314, partial_loss/cycle_loss: 0.0000, 
batch_loss: 18.2327, loss: 23.8980, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9130, LAS: 0.8361, UEM: 0.5198, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3525, partial_loss/deprel_loss: 34.6234, partial_loss/cycle_loss: 0.0000, batch_loss: 27.9692, loss: 24.2112, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.05it/s]\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.314 | 34.623\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.891 | 1.353\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - reg_loss | 0.061 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UEM | 0.373 | 0.520\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LAS | 
0.771 | 0.836\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - loss | 1.581 | 24.211\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEM | 0.155 | 0.255\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UAS | 0.866 | 0.913\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EM | 0.802 | 0.805\n", + "2023-04-06 22:58:01,931 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Epoch duration: 0:01:28.130781\n", + "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Estimated training time remaining: 9:01:20\n", + "2023-04-06 22:58:01,931 - INFO - allennlp.training.trainer - Epoch 6/399\n", + "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:58:01,939 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7928, UAS: 0.8946, LAS: 0.8032, UEM: 0.3837, LEM: 0.1392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9781, partial_loss/deprel_loss: 1.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3320, loss: 1.3132, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||: 3%|2 | 3/111 
[00:02<01:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8970, LAS: 0.8065, UEM: 0.4021, LEM: 0.1350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.9386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9268, loss: 1.2471, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||: 5%|5 | 6/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.8897, LAS: 0.7999, UEM: 0.3630, LEM: 0.1180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9064, partial_loss/deprel_loss: 1.2405, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2353, loss: 1.3079, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||: 9%|9 | 10/111 [00:06<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7893, UAS: 0.8751, LAS: 0.7831, UEM: 0.3085, LEM: 0.0989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1124, partial_loss/deprel_loss: 1.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4348, loss: 1.4786, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||: 13%|#2 | 14/111 [00:08<01:02, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.8743, LAS: 0.7827, UEM: 0.3527, LEM: 0.1199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4962, partial_loss/deprel_loss: 0.8334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8276, loss: 1.4829, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||: 15%|#5 | 17/111 [00:11<01:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6250, UAS: 0.8694, LAS: 0.7787, UEM: 0.3480, LEM: 0.1177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 4.1969, partial_loss/deprel_loss: 2.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1564, loss: 1.5361, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||: 19%|#8 | 21/111 [00:13<01:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7569, UAS: 0.8693, LAS: 0.7786, UEM: 0.3166, LEM: 0.1037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5271, partial_loss/deprel_loss: 1.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8167, loss: 1.5297, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||: 23%|##2 | 25/111 [00:16<00:56, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.8677, LAS: 0.7759, UEM: 0.3006, LEM: 0.0945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3811, partial_loss/deprel_loss: 2.0258, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1586, loss: 1.5526, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||: 26%|##6 | 29/111 [00:18<00:53, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8672, LAS: 0.7753, UEM: 0.3126, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0218, partial_loss/deprel_loss: 1.8331, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9327, loss: 1.5604, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||: 30%|##9 | 33/111 [00:21<00:50, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7770, UAS: 0.8695, LAS: 0.7770, UEM: 0.3171, LEM: 0.1003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 1.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4899, loss: 1.5471, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||: 33%|###3 | 37/111 [00:23<00:46, 1.60it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7841, UAS: 0.8650, LAS: 0.7722, UEM: 0.3010, LEM: 0.0950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2401, partial_loss/deprel_loss: 1.4031, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4324, loss: 1.6028, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||: 37%|###6 | 41/111 [00:26<00:42, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.8680, LAS: 0.7754, UEM: 0.3355, LEM: 0.1209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 1.5741, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||: 41%|#### | 45/111 [00:29<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.8696, LAS: 0.7771, UEM: 0.3369, LEM: 0.1205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6923, partial_loss/deprel_loss: 1.0521, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0421, loss: 1.5538, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||: 44%|####4 | 49/111 [00:31<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7539, UAS: 0.8692, LAS: 0.7765, UEM: 0.3256, LEM: 0.1145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6915, partial_loss/deprel_loss: 1.8414, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8734, loss: 1.5572, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||: 48%|####7 | 53/111 [00:34<00:38, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.8703, LAS: 0.7782, UEM: 0.3360, LEM: 0.1201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6520, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9074, loss: 1.5379, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||: 51%|#####1 | 57/111 [00:37<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8717, LAS: 0.7799, UEM: 0.3610, LEM: 0.1445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9092, partial_loss/deprel_loss: 1.1890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1951, loss: 1.5218, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||: 54%|#####4 | 60/111 [00:39<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8035, UAS: 0.8727, LAS: 0.7813, UEM: 0.3561, LEM: 0.1403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1905, partial_loss/deprel_loss: 1.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2980, loss: 1.5067, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||: 57%|#####6 | 63/111 [00:42<00:34, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.8749, LAS: 0.7839, UEM: 0.3711, LEM: 0.1484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.6615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 1.4817, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||: 59%|#####9 | 66/111 [00:44<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.8736, LAS: 0.7826, UEM: 0.3745, LEM: 0.1515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5556, partial_loss/deprel_loss: 1.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6555, loss: 1.4939, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||: 63%|######3 | 70/111 [00:46<00:28, 1.45it/s]\n" + ] + }, + { + "name": 
"stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.8744, LAS: 0.7837, UEM: 0.3851, LEM: 0.1595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.6582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6565, loss: 1.4852, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||: 66%|######5 | 73/111 [00:50<00:34, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8754, LAS: 0.7846, UEM: 0.3853, LEM: 0.1580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8573, partial_loss/deprel_loss: 1.2353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 1.4768, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||: 68%|######8 | 76/111 [00:53<00:31, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.8775, LAS: 0.7871, UEM: 0.4008, LEM: 0.1662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8025, loss: 1.4523, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||: 71%|#######1 | 79/111 [00:55<00:27, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8768, LAS: 0.7867, UEM: 0.4232, LEM: 0.1931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3685, partial_loss/deprel_loss: 1.5348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5637, loss: 1.4562, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||: 74%|#######3 | 82/111 [00:58<00:24, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7120, UAS: 0.8759, LAS: 0.7859, UEM: 0.4157, LEM: 0.1885, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3845, partial_loss/deprel_loss: 2.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1642, loss: 1.4645, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||: 77%|#######7 | 86/111 [01:00<00:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8155, UAS: 0.8760, LAS: 0.7861, UEM: 0.4115, LEM: 0.1853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8067, partial_loss/deprel_loss: 1.1319, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1291, loss: 1.4605, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||: 80%|######## | 89/111 [01:02<00:16, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7328, UAS: 0.8753, LAS: 0.7855, UEM: 0.4026, LEM: 0.1804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2779, partial_loss/deprel_loss: 1.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0508, loss: 1.4669, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||: 84%|########3 | 93/111 [01:04<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8328, UAS: 0.8765, LAS: 0.7868, UEM: 0.4051, LEM: 0.1809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 1.0645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0804, loss: 1.4538, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||: 86%|########6 | 96/111 [01:06<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8406, UAS: 0.8762, LAS: 0.7865, UEM: 0.4014, LEM: 0.1783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5521, partial_loss/deprel_loss: 0.9905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.4581, batch_reg_loss: 0.0623, reg_loss: 
0.0619 ||: 89%|########9 | 99/111 [01:09<00:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7715, UAS: 0.8767, LAS: 0.7872, UEM: 0.3993, LEM: 0.1761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3737, partial_loss/deprel_loss: 1.5367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5665, loss: 1.4511, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||: 92%|#########1| 102/111 [01:11<00:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7680, UAS: 0.8764, LAS: 0.7870, UEM: 0.3919, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6444, loss: 1.4537, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||: 95%|#########5| 106/111 [01:13<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.8768, LAS: 0.7875, UEM: 0.3925, LEM: 0.1722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 1.4500, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||: 98%|#########8| 109/111 [01:15<00:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.8776, LAS: 0.7883, UEM: 0.3955, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9031, partial_loss/deprel_loss: 1.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2433, loss: 1.4419, batch_reg_loss: 0.0625, reg_loss: 0.0620 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 22:59:19,352 - INFO - 
combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.250 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.903 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - reg_loss | 0.062 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UEM | 0.395 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - LAS | 0.788 | N/A\n", + "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - loss | 1.442 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEM | 0.174 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - UAS | 0.878 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - 
combo.training.tensorboard_writer - EM | 0.812 | N/A\n", + "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Epoch duration: 0:01:17.422262\n", + "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:16\n", + "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Epoch 7/399\n", + "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 22:59:19,361 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.8724, LAS: 0.7842, UEM: 0.3680, LEM: 0.1364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4368, partial_loss/deprel_loss: 0.7830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7763, loss: 1.4874, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||: 4%|3 | 4/111 [00:02<01:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7297, UAS: 0.8701, LAS: 0.7828, UEM: 0.4033, LEM: 0.1768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0957, partial_loss/deprel_loss: 1.9928, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0759, loss: 1.5090, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||: 6%|6 | 7/111 [00:05<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7719, UAS: 0.8774, LAS: 0.7933, UEM: 0.3826, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.6923, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.7077, loss: 1.4414, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||: 10%|9 | 11/111 [00:07<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8024, UAS: 0.8787, LAS: 0.7934, UEM: 0.3521, LEM: 0.1407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 1.2649, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 1.4205, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||: 14%|#3 | 15/111 [00:09<01:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7615, UAS: 0.8748, LAS: 0.7881, UEM: 0.3135, LEM: 0.1196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6249, partial_loss/deprel_loss: 1.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7141, loss: 1.4666, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||: 17%|#7 | 19/111 [00:12<00:58, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.8822, LAS: 0.7962, UEM: 0.3660, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6126, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9508, loss: 1.3872, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||: 20%|#9 | 22/111 [00:14<00:58, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6689, UAS: 0.8766, LAS: 0.7911, UEM: 0.3612, LEM: 0.1459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2741, partial_loss/deprel_loss: 2.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6488, loss: 1.4397, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||: 23%|##3 | 26/111 [00:16<00:53, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.8769, LAS: 0.7922, UEM: 0.3532, LEM: 0.1394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9310, loss: 1.4379, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||: 27%|##7 | 30/111 [00:19<00:51, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.8768, LAS: 0.7918, UEM: 0.3561, LEM: 0.1370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8156, loss: 1.4428, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||: 31%|### | 34/111 [00:21<00:49, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7718, UAS: 0.8759, LAS: 0.7906, UEM: 0.3526, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3521, partial_loss/deprel_loss: 1.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5261, loss: 1.4532, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||: 34%|###4 | 38/111 [00:24<00:47, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7682, UAS: 0.8763, LAS: 0.7911, UEM: 0.3421, LEM: 0.1291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5765, partial_loss/deprel_loss: 1.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6931, loss: 1.4514, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||: 38%|###7 | 42/111 [00:27<00:45, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.8781, LAS: 0.7929, UEM: 0.3316, LEM: 0.1220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 1.1158, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.0980, loss: 1.4348, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||: 41%|####1 | 46/111 [00:29<00:40, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7495, UAS: 0.8762, LAS: 0.7916, UEM: 0.3351, LEM: 0.1242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0049, partial_loss/deprel_loss: 1.8432, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9386, loss: 1.4529, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||: 45%|####5 | 50/111 [00:31<00:37, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7735, UAS: 0.8790, LAS: 0.7953, UEM: 0.3877, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4529, partial_loss/deprel_loss: 1.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5387, loss: 1.4166, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||: 49%|####8 | 54/111 [00:35<00:39, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8136, UAS: 0.8792, LAS: 0.7954, UEM: 0.3826, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9952, partial_loss/deprel_loss: 1.2018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2236, loss: 1.4151, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||: 51%|#####1 | 57/111 [00:37<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7092, UAS: 0.8797, LAS: 0.7962, UEM: 0.4184, LEM: 0.2082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7240, partial_loss/deprel_loss: 2.1644, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3395, loss: 1.4103, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||: 54%|#####4 | 60/111 [00:39<00:36, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.7540, UAS: 0.8799, LAS: 0.7961, UEM: 0.4070, LEM: 0.1991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8092, partial_loss/deprel_loss: 1.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7963, loss: 1.4121, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||: 58%|#####7 | 64/111 [00:42<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.8805, LAS: 0.7967, UEM: 0.4083, LEM: 0.2006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9000, partial_loss/deprel_loss: 1.1946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1989, loss: 1.4027, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||: 60%|###### | 67/111 [00:44<00:30, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.8815, LAS: 0.7979, UEM: 0.4116, LEM: 0.2017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6882, partial_loss/deprel_loss: 0.9346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9486, loss: 1.3897, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||: 63%|######3 | 70/111 [00:46<00:30, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.8812, LAS: 0.7976, UEM: 0.4122, LEM: 0.2035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 1.3910, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||: 66%|######5 | 73/111 [00:48<00:27, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8465, UAS: 0.8816, LAS: 0.7982, UEM: 0.4122, LEM: 0.2019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, 
partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9186, loss: 1.3860, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||: 68%|######8 | 76/111 [00:50<00:25, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7487, UAS: 0.8817, LAS: 0.7982, UEM: 0.4104, LEM: 0.1998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8556, partial_loss/deprel_loss: 1.6892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7859, loss: 1.3852, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||: 71%|#######1 | 79/111 [00:53<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8828, LAS: 0.7995, UEM: 0.4079, LEM: 0.1960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8511, partial_loss/deprel_loss: 1.1586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1606, loss: 1.3738, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||: 74%|#######3 | 82/111 [00:55<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8831, LAS: 0.7998, UEM: 0.3986, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2809, partial_loss/deprel_loss: 1.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4682, loss: 1.3714, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||: 77%|#######7 | 86/111 [00:57<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.8841, LAS: 0.8011, UEM: 0.4051, LEM: 0.1932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 1.3591, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||: 80%|######## | 89/111 [00:59<00:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8384, UAS: 0.8851, LAS: 0.8022, UEM: 0.4059, LEM: 0.1904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7558, partial_loss/deprel_loss: 0.8878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9250, loss: 1.3475, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||: 83%|########2 | 92/111 [01:01<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6849, UAS: 0.8847, LAS: 0.8021, UEM: 0.4073, LEM: 0.1900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0226, partial_loss/deprel_loss: 2.1493, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3876, loss: 1.3458, batch_reg_loss: 0.0637, reg_loss: 0.0630 ||: 86%|########6 | 96/111 [01:04<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8834, LAS: 0.8006, UEM: 0.4017, LEM: 0.1872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0285, partial_loss/deprel_loss: 1.8749, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9693, loss: 1.3587, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||: 89%|########9 | 99/111 [01:06<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8169, UAS: 0.8834, LAS: 0.8005, UEM: 0.4020, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8733, partial_loss/deprel_loss: 1.1504, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1587, loss: 1.3588, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||: 92%|#########1| 102/111 [01:09<00:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.8850, LAS: 0.8022, UEM: 0.4122, LEM: 0.1905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.6209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 1.3414, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||: 95%|#########5| 106/111 [01:11<00:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.8857, LAS: 0.8029, UEM: 0.4147, LEM: 0.1914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4652, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7900, loss: 1.3339, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||: 98%|#########8| 109/111 [01:13<00:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.8854, LAS: 0.8026, UEM: 0.4124, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8597, partial_loss/deprel_loss: 0.9947, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0315, loss: 1.3354, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||: 100%|##########| 111/111 [01:15<00:00, 1.48it/s]\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - 
EUEM | 0.000 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.995 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.860 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - reg_loss | 0.063 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UEM | 0.412 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - LAS | 0.803 | N/A\n", + "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - loss | 1.335 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEM | 0.190 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - UAS | 0.885 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EM | 0.827 | N/A\n", + "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Epoch duration: 0:01:15.022627\n", + "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Estimated training time remaining: 8:48:26\n", + "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Epoch 8/399\n", + "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 
23:00:34,384 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8241, UAS: 0.8930, LAS: 0.8071, UEM: 0.2937, LEM: 0.0688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8920, partial_loss/deprel_loss: 1.0848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1101, loss: 1.2838, batch_reg_loss: 0.0639, reg_loss: 0.0639 ||: 4%|3 | 4/111 [00:02<01:05, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.8886, LAS: 0.8066, UEM: 0.3058, LEM: 0.0816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9010, partial_loss/deprel_loss: 1.1552, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1683, loss: 1.2793, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||: 7%|7 | 8/111 [00:04<01:03, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9018, LAS: 0.8220, UEM: 0.5010, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1971, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 1.1506, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||: 10%|9 | 11/111 [00:07<01:03, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.8885, LAS: 0.8093, UEM: 0.5000, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 0.6960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 1.3050, batch_reg_loss: 0.0640, reg_loss: 0.0640 ||: 13%|#2 | 14/111 [00:09<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.8872, LAS: 0.8077, UEM: 0.4793, 
LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.7968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 1.3102, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||: 15%|#5 | 17/111 [00:11<01:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7552, UAS: 0.8892, LAS: 0.8111, UEM: 0.4579, LEM: 0.2212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8160, partial_loss/deprel_loss: 1.5796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6910, loss: 1.2699, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||: 19%|#8 | 21/111 [00:14<01:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8090, UAS: 0.8856, LAS: 0.8065, UEM: 0.4306, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1190, partial_loss/deprel_loss: 1.1705, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2244, loss: 1.3033, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||: 22%|##1 | 24/111 [00:16<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7897, UAS: 0.8861, LAS: 0.8069, UEM: 0.4112, LEM: 0.1927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2958, partial_loss/deprel_loss: 1.3087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3704, loss: 1.2958, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||: 24%|##4 | 27/111 [00:18<01:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8839, LAS: 0.8044, UEM: 0.4072, LEM: 0.1892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4421, partial_loss/deprel_loss: 1.8969, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0702, loss: 1.3262, batch_reg_loss: 0.0643, reg_loss: 
0.0641 ||: 27%|##7 | 30/111 [00:20<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.8813, LAS: 0.8011, UEM: 0.3874, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 1.1863, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1903, loss: 1.3609, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||: 31%|### | 34/111 [00:23<00:53, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.8837, LAS: 0.8038, UEM: 0.4387, LEM: 0.2372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1111, partial_loss/deprel_loss: 1.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3019, loss: 1.3366, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||: 33%|###3 | 37/111 [00:25<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.8854, LAS: 0.8050, UEM: 0.4272, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3545, partial_loss/deprel_loss: 1.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5214, loss: 1.3286, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||: 36%|###6 | 40/111 [00:27<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.8877, LAS: 0.8072, UEM: 0.4217, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5300, partial_loss/deprel_loss: 0.9049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8945, loss: 1.3072, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||: 39%|###8 | 43/111 [00:29<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.8908, LAS: 0.8105, UEM: 0.4339, LEM: 0.2148, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5897, partial_loss/deprel_loss: 0.8662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8754, loss: 1.2774, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||: 41%|####1 | 46/111 [00:32<00:47, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.8909, LAS: 0.8105, UEM: 0.4243, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8100, partial_loss/deprel_loss: 0.9878, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 1.2768, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||: 44%|####4 | 49/111 [00:34<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4112, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9683, loss: 1.2818, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||: 48%|####7 | 53/111 [00:36<00:39, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4056, LEM: 0.1924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6974, partial_loss/deprel_loss: 0.9227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9424, loss: 1.2799, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.8911, LAS: 0.8107, UEM: 0.4065, LEM: 0.1909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7933, partial_loss/deprel_loss: 0.9271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.2707, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||: 54%|#####4 | 
60/111 [00:41<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8913, LAS: 0.8110, UEM: 0.4163, LEM: 0.1957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5222, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8501, loss: 1.2691, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||: 57%|#####6 | 63/111 [00:43<00:33, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.8926, LAS: 0.8125, UEM: 0.4278, LEM: 0.2061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 1.0206, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0312, loss: 1.2552, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||: 59%|#####9 | 66/111 [00:45<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.8931, LAS: 0.8132, UEM: 0.4331, LEM: 0.2078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1884, partial_loss/deprel_loss: 1.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3227, loss: 1.2490, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||: 63%|######3 | 70/111 [00:48<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7758, UAS: 0.8925, LAS: 0.8121, UEM: 0.4233, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6001, loss: 1.2582, batch_reg_loss: 0.0650, reg_loss: 0.0644 ||: 67%|######6 | 74/111 [00:50<00:24, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 
0.8917, LAS: 0.8114, UEM: 0.4194, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5735, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8643, loss: 1.2660, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||: 70%|####### | 78/111 [00:53<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.8931, LAS: 0.8129, UEM: 0.4242, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.7510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7497, loss: 1.2519, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||: 73%|#######2 | 81/111 [00:55<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6999, UAS: 0.8912, LAS: 0.8106, UEM: 0.4176, LEM: 0.1948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5586, partial_loss/deprel_loss: 2.1598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3047, loss: 1.2725, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||: 76%|#######5 | 84/111 [00:57<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7984, UAS: 0.8920, LAS: 0.8114, UEM: 0.4254, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2174, partial_loss/deprel_loss: 1.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4084, loss: 1.2663, batch_reg_loss: 0.0652, reg_loss: 0.0645 ||: 79%|#######9 | 88/111 [01:00<00:15, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7645, UAS: 0.8914, LAS: 0.8106, UEM: 0.4171, LEM: 0.1945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7351, partial_loss/deprel_loss: 1.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.7596, loss: 1.2742, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||: 83%|########2 | 92/111 [01:02<00:12, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.8916, LAS: 0.8109, UEM: 0.4169, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4136, partial_loss/deprel_loss: 0.6496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6677, loss: 1.2720, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||: 86%|########6 | 96/111 [01:05<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.8930, LAS: 0.8124, UEM: 0.4280, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4469, partial_loss/deprel_loss: 0.7590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 1.2586, batch_reg_loss: 0.0654, reg_loss: 0.0646 ||: 89%|########9 | 99/111 [01:08<00:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7769, UAS: 0.8935, LAS: 0.8130, UEM: 0.4298, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6781, partial_loss/deprel_loss: 1.5453, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6373, loss: 1.2527, batch_reg_loss: 0.0655, reg_loss: 0.0646 ||: 92%|#########1| 102/111 [01:10<00:06, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6829, UAS: 0.8911, LAS: 0.8105, UEM: 0.4258, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1513, partial_loss/deprel_loss: 2.1113, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3848, loss: 1.2753, batch_reg_loss: 0.0655, reg_loss: 0.0647 ||: 95%|#########4| 105/111 [01:13<00:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.7566, UAS: 0.8903, LAS: 0.8095, UEM: 0.4247, LEM: 0.1967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8494, partial_loss/deprel_loss: 1.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8367, loss: 1.2862, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||: 97%|#########7| 108/111 [01:15<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.8911, LAS: 0.8104, UEM: 0.4280, LEM: 0.1988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 1.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0965, loss: 1.2771, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||: 100%|##########| 111/111 [01:16<00:00, 1.44it/s]\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.100 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.755 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer 
- reg_loss | 0.065 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UEM | 0.428 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LAS | 0.810 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - loss | 1.277 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2424.097 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEM | 0.199 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UAS | 0.891 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EM | 0.828 | N/A\n", + "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Epoch duration: 0:01:16.982102\n", + "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Estimated training time remaining: 8:44:16\n", + "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Epoch 9/399\n", + "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:01:51,366 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9255, LAS: 0.8548, UEM: 0.5504, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4220, partial_loss/deprel_loss: 0.6260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8275, batch_reg_loss: 0.0656, reg_loss: 0.0656 ||: 3%|2 | 3/111 [00:02<01:21, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9245, LAS: 0.8515, UEM: 0.5266, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.9576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8760, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||: 5%|5 | 6/111 [00:04<01:20, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9161, LAS: 0.8419, UEM: 0.4940, LEM: 0.2270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8656, partial_loss/deprel_loss: 1.0827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9815, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||: 8%|8 | 9/111 [00:06<01:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9148, LAS: 0.8396, UEM: 0.4936, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.7863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7874, loss: 1.0120, batch_reg_loss: 0.0658, reg_loss: 0.0657 ||: 11%|# | 12/111 [00:09<01:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7472, UAS: 0.9118, LAS: 0.8363, UEM: 0.4936, LEM: 0.2092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1431, partial_loss/deprel_loss: 1.7409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8873, loss: 1.0389, batch_reg_loss: 0.0659, reg_loss: 0.0657 ||: 14%|#4 | 16/111 [00:11<01:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9033, LAS: 0.8265, UEM: 0.4604, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 1.1324, batch_reg_loss: 0.0659, reg_loss: 0.0658 ||: 18%|#8 | 20/111 [00:13<01:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8059, UAS: 0.9014, LAS: 0.8239, UEM: 0.4295, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1199, partial_loss/deprel_loss: 1.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4550, loss: 1.1575, batch_reg_loss: 0.0660, reg_loss: 0.0658 ||: 22%|##1 | 24/111 [00:16<00:57, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7750, UAS: 0.8952, LAS: 0.8171, UEM: 0.4111, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6847, partial_loss/deprel_loss: 1.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6177, loss: 1.2197, batch_reg_loss: 0.0661, reg_loss: 0.0658 ||: 25%|##5 | 28/111 [00:18<00:52, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.8923, LAS: 0.8137, UEM: 0.3953, LEM: 0.1563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2574, partial_loss/deprel_loss: 1.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9746, loss: 1.2571, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||: 29%|##8 | 32/111 [00:21<00:50, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.8916, LAS: 0.8133, UEM: 0.3940, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5520, 
partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7862, loss: 1.2609, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||: 32%|###2 | 36/111 [00:23<00:48, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8140, UAS: 0.8902, LAS: 0.8114, UEM: 0.3764, LEM: 0.1479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1807, partial_loss/deprel_loss: 1.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2734, loss: 1.2838, batch_reg_loss: 0.0663, reg_loss: 0.0660 ||: 36%|###6 | 40/111 [00:26<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.8915, LAS: 0.8126, UEM: 0.4016, LEM: 0.1669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 1.2723, batch_reg_loss: 0.0664, reg_loss: 0.0660 ||: 40%|###9 | 44/111 [00:29<00:43, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8098, UAS: 0.8917, LAS: 0.8122, UEM: 0.3866, LEM: 0.1573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9682, partial_loss/deprel_loss: 1.2962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2971, loss: 1.2742, batch_reg_loss: 0.0665, reg_loss: 0.0660 ||: 43%|####3 | 48/111 [00:31<00:41, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8915, LAS: 0.8119, UEM: 0.3734, LEM: 0.1493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 1.0904, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1112, loss: 1.2763, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||: 47%|####6 | 52/111 [00:34<00:39, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.8937, LAS: 0.8143, UEM: 0.3817, LEM: 0.1525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8274, partial_loss/deprel_loss: 0.9894, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0237, loss: 1.2510, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||: 50%|##### | 56/111 [00:37<00:37, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7726, UAS: 0.8911, LAS: 0.8114, UEM: 0.3731, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7883, partial_loss/deprel_loss: 1.6515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7456, loss: 1.2778, batch_reg_loss: 0.0667, reg_loss: 0.0661 ||: 53%|#####3 | 59/111 [00:39<00:35, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8919, LAS: 0.8123, UEM: 0.3775, LEM: 0.1503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6848, loss: 1.2680, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||: 57%|#####6 | 63/111 [00:42<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.8923, LAS: 0.8129, UEM: 0.3800, LEM: 0.1507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3847, partial_loss/deprel_loss: 0.6543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6672, loss: 1.2614, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||: 60%|###### | 67/111 [00:45<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.8945, LAS: 0.8153, UEM: 0.3887, LEM: 0.1545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4404, 
partial_loss/deprel_loss: 0.7233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7337, loss: 1.2393, batch_reg_loss: 0.0669, reg_loss: 0.0663 ||: 64%|######3 | 71/111 [00:47<00:27, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8122, UAS: 0.8962, LAS: 0.8173, UEM: 0.4219, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 1.3085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3088, loss: 1.2234, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||: 67%|######6 | 74/111 [00:50<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.8964, LAS: 0.8179, UEM: 0.4236, LEM: 0.1933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5015, partial_loss/deprel_loss: 1.4831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5538, loss: 1.2192, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||: 69%|######9 | 77/111 [00:52<00:24, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8175, UAS: 0.8970, LAS: 0.8187, UEM: 0.4197, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0788, partial_loss/deprel_loss: 1.1409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1956, loss: 1.2138, batch_reg_loss: 0.0671, reg_loss: 0.0663 ||: 73%|#######2 | 81/111 [00:54<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.8961, LAS: 0.8179, UEM: 0.4136, LEM: 0.1848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7436, partial_loss/deprel_loss: 0.8710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9127, loss: 1.2214, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||: 
77%|#######6 | 85/111 [00:57<00:17, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7341, UAS: 0.8956, LAS: 0.8174, UEM: 0.4083, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 1.8813, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0237, loss: 1.2272, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||: 80%|######## | 89/111 [00:59<00:14, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.8969, LAS: 0.8191, UEM: 0.4323, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2403, partial_loss/deprel_loss: 0.5870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 1.2123, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||: 84%|########3 | 93/111 [01:02<00:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7063, UAS: 0.8948, LAS: 0.8169, UEM: 0.4339, LEM: 0.2011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6918, partial_loss/deprel_loss: 2.1989, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3648, loss: 1.2362, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||: 86%|########6 | 96/111 [01:05<00:10, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.8947, LAS: 0.8168, UEM: 0.4295, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0917, partial_loss/deprel_loss: 1.1721, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2234, loss: 1.2352, batch_reg_loss: 0.0674, reg_loss: 0.0665 ||: 89%|########9 | 99/111 [01:07<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8250, UAS: 0.8951, LAS: 0.8172, UEM: 0.4260, LEM: 0.1936, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 1.0274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0777, loss: 1.2291, batch_reg_loss: 0.0675, reg_loss: 0.0665 ||: 93%|#########2| 103/111 [01:10<00:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8082, UAS: 0.8962, LAS: 0.8186, UEM: 0.4419, LEM: 0.2084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1479, partial_loss/deprel_loss: 1.1772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2388, loss: 1.2158, batch_reg_loss: 0.0675, reg_loss: 0.0666 ||: 95%|#########5| 106/111 [01:12<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8127, UAS: 0.8962, LAS: 0.8185, UEM: 0.4424, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 1.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2520, loss: 1.2173, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||: 99%|#########9| 110/111 [01:14<00:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7871, UAS: 0.8960, LAS: 0.8182, UEM: 0.4402, LEM: 0.2085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3663, partial_loss/deprel_loss: 1.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 1.2197, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||: 100%|##########| 111/111 [01:15<00:00, 1.48it/s]\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 
0.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.419 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.366 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - reg_loss | 0.067 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - UEM | 0.440 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LAS | 0.818 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - loss | 1.220 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEM | 0.209 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - UAS | 0.896 | N/A\n", + "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - EM | 0.787 | N/A\n", + "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:03:06,511 - INFO - combo.training.trainer - Epoch 
duration: 0:01:15.152380\n", + "2023-04-06 23:03:06,512 - INFO - combo.training.trainer - Estimated training time remaining: 8:39:28\n", + "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Epoch 10/399\n", + "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:03:06,518 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9211, LAS: 0.8489, UEM: 0.4350, LEM: 0.1673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6806, partial_loss/deprel_loss: 0.8446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.9582, batch_reg_loss: 0.0677, reg_loss: 0.0676 ||: 3%|2 | 3/111 [00:02<01:13, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7567, UAS: 0.9095, LAS: 0.8358, UEM: 0.3786, LEM: 0.1376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0075, partial_loss/deprel_loss: 1.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7939, loss: 1.0705, batch_reg_loss: 0.0677, reg_loss: 0.0677 ||: 6%|6 | 7/111 [00:04<01:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9037, LAS: 0.8297, UEM: 0.4104, LEM: 0.1799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4051, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6359, loss: 1.1128, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||: 9%|9 | 10/111 [00:06<01:06, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8079, UAS: 0.9057, LAS: 0.8309, UEM: 0.3985, LEM: 0.1653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1594, partial_loss/deprel_loss: 1.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4470, loss: 1.1057, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||: 12%|#1 | 13/111 [00:08<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7768, UAS: 0.8954, LAS: 0.8210, UEM: 0.3798, LEM: 0.1587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8156, partial_loss/deprel_loss: 1.4734, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6097, loss: 1.1918, batch_reg_loss: 0.0679, reg_loss: 0.0678 ||: 14%|#4 | 16/111 [00:10<01:05, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9001, LAS: 0.8265, UEM: 0.3925, LEM: 0.1602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.6757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 1.1418, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||: 18%|#8 | 20/111 [00:13<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9033, LAS: 0.8293, UEM: 0.4103, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8599, loss: 1.1190, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||: 21%|## | 23/111 [00:15<00:59, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7607, UAS: 0.9003, LAS: 0.8257, UEM: 0.3788, LEM: 0.1528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9901, partial_loss/deprel_loss: 1.5372, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6959, 
loss: 1.1511, batch_reg_loss: 0.0681, reg_loss: 0.0679 ||: 25%|##5 | 28/111 [00:17<00:50, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9034, LAS: 0.8289, UEM: 0.3855, LEM: 0.1509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7388, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0516, loss: 1.1226, batch_reg_loss: 0.0682, reg_loss: 0.0679 ||: 29%|##8 | 32/111 [00:20<00:51, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9063, LAS: 0.8325, UEM: 0.4192, LEM: 0.1846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3700, partial_loss/deprel_loss: 0.6140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 1.0953, batch_reg_loss: 0.0683, reg_loss: 0.0679 ||: 32%|###2 | 36/111 [00:23<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9079, LAS: 0.8343, UEM: 0.4254, LEM: 0.1857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4378, partial_loss/deprel_loss: 0.7192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7312, loss: 1.0799, batch_reg_loss: 0.0683, reg_loss: 0.0680 ||: 35%|###5 | 39/111 [00:25<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9090, LAS: 0.8357, UEM: 0.4734, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5374, partial_loss/deprel_loss: 0.8689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 1.0719, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||: 38%|###7 | 42/111 [00:28<00:52, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9110, LAS: 
0.8381, UEM: 0.4946, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.8453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8644, loss: 1.0472, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||: 41%|#### | 45/111 [00:31<00:51, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9084, LAS: 0.8351, UEM: 0.4845, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9251, loss: 1.0728, batch_reg_loss: 0.0685, reg_loss: 0.0680 ||: 43%|####3 | 48/111 [00:33<00:48, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8088, UAS: 0.9075, LAS: 0.8338, UEM: 0.4736, LEM: 0.2393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1152, partial_loss/deprel_loss: 1.1692, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2269, loss: 1.0826, batch_reg_loss: 0.0685, reg_loss: 0.0681 ||: 46%|####5 | 51/111 [00:35<00:44, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7492, UAS: 0.9047, LAS: 0.8305, UEM: 0.4617, LEM: 0.2330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8205, partial_loss/deprel_loss: 1.8595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9202, loss: 1.1140, batch_reg_loss: 0.0686, reg_loss: 0.0681 ||: 49%|####8 | 54/111 [00:37<00:41, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7964, UAS: 0.9034, LAS: 0.8291, UEM: 0.4487, LEM: 0.2257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2039, partial_loss/deprel_loss: 1.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3791, loss: 1.1273, 
batch_reg_loss: 0.0686, reg_loss: 0.0681 ||: 51%|#####1 | 57/111 [00:39<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7435, UAS: 0.9016, LAS: 0.8268, UEM: 0.4383, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2836, partial_loss/deprel_loss: 1.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9936, loss: 1.1479, batch_reg_loss: 0.0687, reg_loss: 0.0682 ||: 55%|#####4 | 61/111 [00:42<00:34, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8348, UAS: 0.9023, LAS: 0.8278, UEM: 0.4403, LEM: 0.2168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 1.0006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 1.1379, batch_reg_loss: 0.0688, reg_loss: 0.0682 ||: 58%|#####7 | 64/111 [00:44<00:32, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9030, LAS: 0.8286, UEM: 0.4388, LEM: 0.2130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.7770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7944, loss: 1.1308, batch_reg_loss: 0.0689, reg_loss: 0.0682 ||: 60%|###### | 67/111 [00:46<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9032, LAS: 0.8287, UEM: 0.4419, LEM: 0.2154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3263, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 1.1277, batch_reg_loss: 0.0689, reg_loss: 0.0683 ||: 63%|######3 | 70/111 [00:48<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9024, LAS: 0.8277, UEM: 0.4353, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6941, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 1.1377, batch_reg_loss: 0.0690, reg_loss: 0.0683 ||: 66%|######5 | 73/111 [00:50<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7257, UAS: 0.9023, LAS: 0.8276, UEM: 0.4461, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5688, partial_loss/deprel_loss: 1.8292, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0462, loss: 1.1387, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||: 68%|######8 | 76/111 [00:52<00:24, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9029, LAS: 0.8282, UEM: 0.4496, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4104, partial_loss/deprel_loss: 0.7276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7332, loss: 1.1344, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||: 71%|#######1 | 79/111 [00:55<00:22, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9011, LAS: 0.8263, UEM: 0.4404, LEM: 0.2131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4546, partial_loss/deprel_loss: 1.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3746, loss: 1.1528, batch_reg_loss: 0.0692, reg_loss: 0.0684 ||: 75%|#######4 | 83/111 [00:57<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.9006, LAS: 0.8256, UEM: 0.4416, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9790, partial_loss/deprel_loss: 
1.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9498, loss: 1.1586, batch_reg_loss: 0.0693, reg_loss: 0.0684 ||: 77%|#######7 | 86/111 [00:59<00:17, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9005, LAS: 0.8255, UEM: 0.4447, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4351, partial_loss/deprel_loss: 0.7105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7247, loss: 1.1604, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||: 81%|########1 | 90/111 [01:02<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9016, LAS: 0.8266, UEM: 0.4473, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4284, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 1.1503, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||: 84%|########3 | 93/111 [01:04<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9025, LAS: 0.8278, UEM: 0.4611, LEM: 0.2269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3530, partial_loss/deprel_loss: 1.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3427, loss: 1.1401, batch_reg_loss: 0.0695, reg_loss: 0.0685 ||: 86%|########6 | 96/111 [01:06<00:10, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9011, LAS: 0.8262, UEM: 0.4614, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.5647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 1.1574, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||: 90%|######### | 100/111 [01:08<00:07, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7670, UAS: 0.9000, LAS: 0.8250, UEM: 0.4556, LEM: 0.2241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6908, partial_loss/deprel_loss: 1.5468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6452, loss: 1.1669, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||: 94%|#########3| 104/111 [01:11<00:04, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.8997, LAS: 0.8246, UEM: 0.4485, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9835, partial_loss/deprel_loss: 1.0113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 1.1688, batch_reg_loss: 0.0697, reg_loss: 0.0686 ||: 97%|#########7| 108/111 [01:13<00:01, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8993, LAS: 0.8241, UEM: 0.4477, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3591, partial_loss/deprel_loss: 0.6441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 1.1728, batch_reg_loss: 0.0698, reg_loss: 0.0687 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:04:21,844 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9091, LAS: 0.8425, UEM: 0.5537, LEM: 0.2550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4429, partial_loss/deprel_loss: 25.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 20.5353, loss: 33.4054, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:12, 1.17s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9252, LAS: 0.8642, UEM: 
0.6450, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 19.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9139, loss: 26.8195, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:05<00:08, 1.10s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9317, LAS: 0.8693, UEM: 0.6302, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5259, partial_loss/deprel_loss: 23.7138, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0762, loss: 25.0754, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:08<00:05, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9354, LAS: 0.8720, UEM: 0.6148, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0366, partial_loss/deprel_loss: 42.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 34.3200, loss: 24.3461, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:02, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9327, LAS: 0.8688, UEM: 0.5809, LEM: 0.3203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1886, partial_loss/deprel_loss: 48.1446, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7534, loss: 25.3898, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:04:34,521 - INFO - 
combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.644 | 48.145\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.359 | 1.189\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - reg_loss | 0.069 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UEM | 0.448 | 0.581\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LAS | 0.824 | 0.869\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - loss | 1.173 | 25.390\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEM | 0.218 | 0.320\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UAS | 0.899 | 0.933\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EM | 0.879 | 0.844\n", + "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 
| N/A\n", + "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Epoch duration: 0:01:28.011201\n", + "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Estimated training time remaining: 8:42:55\n", + "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Epoch 11/399\n", + "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:04:34,529 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7318, UAS: 0.9023, LAS: 0.8266, UEM: 0.6184, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2381, partial_loss/deprel_loss: 1.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0035, loss: 1.1306, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||: 3%|2 | 3/111 [00:02<01:23, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9063, LAS: 0.8290, UEM: 0.4976, LEM: 0.2240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 1.1307, batch_reg_loss: 0.0699, reg_loss: 0.0699 ||: 5%|5 | 6/111 [00:04<01:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9103, LAS: 0.8362, UEM: 0.4687, LEM: 0.1954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1053, partial_loss/deprel_loss: 1.2357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2797, loss: 1.0641, batch_reg_loss: 0.0700, reg_loss: 0.0699 ||: 9%|9 | 10/111 [00:06<01:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7896, UAS: 0.9057, LAS: 0.8323, UEM: 0.4223, LEM: 0.1711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5511, partial_loss/deprel_loss: 1.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4978, loss: 1.0987, batch_reg_loss: 0.0701, reg_loss: 0.0700 ||: 12%|#1 | 13/111 [00:08<01:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7038, UAS: 0.8933, LAS: 0.8198, UEM: 0.4015, LEM: 0.1612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3903, partial_loss/deprel_loss: 2.1584, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4749, loss: 1.2235, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||: 15%|#5 | 17/111 [00:11<01:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.8926, LAS: 0.8186, UEM: 0.3850, LEM: 0.1549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5808, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8557, loss: 1.2307, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||: 18%|#8 | 20/111 [00:13<01:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8979, LAS: 0.8248, UEM: 0.4068, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4397, partial_loss/deprel_loss: 0.6836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 1.1735, batch_reg_loss: 0.0703, reg_loss: 0.0701 ||: 21%|## | 23/111 [00:16<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9013, LAS: 0.8287, UEM: 0.4106, LEM: 0.1665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, 
partial_loss/deprel_loss: 0.9933, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0037, loss: 1.1421, batch_reg_loss: 0.0704, reg_loss: 0.0701 ||: 24%|##4 | 27/111 [00:18<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9032, LAS: 0.8303, UEM: 0.4190, LEM: 0.1744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 1.1172, batch_reg_loss: 0.0705, reg_loss: 0.0701 ||: 28%|##7 | 31/111 [00:21<00:54, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9035, LAS: 0.8302, UEM: 0.4089, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6362, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8333, loss: 1.1133, batch_reg_loss: 0.0705, reg_loss: 0.0702 ||: 31%|### | 34/111 [00:23<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9044, LAS: 0.8316, UEM: 0.4279, LEM: 0.1793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.6374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6515, loss: 1.1019, batch_reg_loss: 0.0706, reg_loss: 0.0702 ||: 34%|###4 | 38/111 [00:25<00:47, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8177, UAS: 0.9025, LAS: 0.8289, UEM: 0.4126, LEM: 0.1706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0452, partial_loss/deprel_loss: 1.1970, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2373, loss: 1.1266, batch_reg_loss: 0.0707, reg_loss: 0.0703 ||: 38%|###7 | 42/111 [00:28<00:44, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.9022, LAS: 0.8284, UEM: 0.3981, LEM: 0.1621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1751, partial_loss/deprel_loss: 1.1391, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2171, loss: 1.1310, batch_reg_loss: 0.0708, reg_loss: 0.0703 ||: 41%|####1 | 46/111 [00:30<00:40, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9036, LAS: 0.8304, UEM: 0.4308, LEM: 0.1934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6100, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 1.1156, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||: 45%|####5 | 50/111 [00:33<00:40, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7861, UAS: 0.8996, LAS: 0.8257, UEM: 0.4162, LEM: 0.1863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4086, partial_loss/deprel_loss: 1.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5223, loss: 1.1565, batch_reg_loss: 0.0709, reg_loss: 0.0704 ||: 49%|####8 | 54/111 [00:36<00:38, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9003, LAS: 0.8264, UEM: 0.4200, LEM: 0.1901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 1.1513, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||: 51%|#####1 | 57/111 [00:39<00:40, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.8989, LAS: 0.8248, UEM: 0.4080, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4330, 
partial_loss/deprel_loss: 1.2713, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3747, loss: 1.1698, batch_reg_loss: 0.0711, reg_loss: 0.0705 ||: 55%|#####4 | 61/111 [00:41<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8991, LAS: 0.8250, UEM: 0.4074, LEM: 0.1823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.6930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.1708, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||: 58%|#####7 | 64/111 [00:43<00:32, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9010, LAS: 0.8273, UEM: 0.4541, LEM: 0.2326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 1.1522, batch_reg_loss: 0.0713, reg_loss: 0.0705 ||: 60%|###### | 67/111 [00:46<00:33, 1.30it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9019, LAS: 0.8284, UEM: 0.4523, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5616, partial_loss/deprel_loss: 0.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 1.1425, batch_reg_loss: 0.0713, reg_loss: 0.0706 ||: 63%|######3 | 70/111 [00:48<00:30, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9028, LAS: 0.8292, UEM: 0.4489, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.8075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8344, loss: 1.1331, batch_reg_loss: 0.0714, reg_loss: 0.0706 ||: 
67%|######6 | 74/111 [00:51<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8455, UAS: 0.9026, LAS: 0.8289, UEM: 0.4483, LEM: 0.2209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7892, partial_loss/deprel_loss: 0.9486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 1.1360, batch_reg_loss: 0.0715, reg_loss: 0.0706 ||: 69%|######9 | 77/111 [00:53<00:24, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9023, LAS: 0.8285, UEM: 0.4494, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5825, partial_loss/deprel_loss: 1.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.1386, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||: 72%|#######2 | 80/111 [00:55<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7285, UAS: 0.9020, LAS: 0.8283, UEM: 0.4558, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6126, partial_loss/deprel_loss: 1.8106, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0426, loss: 1.1390, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||: 75%|#######4 | 83/111 [00:57<00:21, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9022, LAS: 0.8285, UEM: 0.4532, LEM: 0.2213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4983, partial_loss/deprel_loss: 0.8175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.1382, batch_reg_loss: 0.0717, reg_loss: 0.0707 ||: 78%|#######8 | 87/111 [01:00<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9024, LAS: 0.8289, UEM: 0.4612, LEM: 0.2287, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4406, partial_loss/deprel_loss: 0.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 1.1361, batch_reg_loss: 0.0718, reg_loss: 0.0708 ||: 82%|########1 | 91/111 [01:03<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9021, LAS: 0.8285, UEM: 0.4575, LEM: 0.2255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4676, partial_loss/deprel_loss: 1.4466, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5226, loss: 1.1405, batch_reg_loss: 0.0719, reg_loss: 0.0708 ||: 86%|########5 | 95/111 [01:05<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7878, UAS: 0.9016, LAS: 0.8278, UEM: 0.4487, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5254, partial_loss/deprel_loss: 1.4661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5499, loss: 1.1483, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||: 89%|########9 | 99/111 [01:08<00:08, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8066, UAS: 0.9015, LAS: 0.8276, UEM: 0.4439, LEM: 0.2164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1248, partial_loss/deprel_loss: 1.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2587, loss: 1.1491, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||: 93%|#########2| 103/111 [01:10<00:05, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9024, LAS: 0.8286, UEM: 0.4471, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0125, loss: 1.1405, batch_reg_loss: 0.0721, 
reg_loss: 0.0710 ||: 96%|#########6| 107/111 [01:12<00:02, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.844 | N/A\n", + "2023-04-06 
23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 2.120 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - reg_loss | 0.071 | N/A\n", + "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UEM | 0.451 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LAS | 0.829 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - loss | 1.141 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEM | 0.220 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - UAS | 0.902 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EM | 0.750 | N/A\n", + "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Epoch duration: 0:01:15.582589\n", + "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Estimated training time remaining: 8:38:50\n", + "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Epoch 12/399\n", + "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:05:50,112 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9145, LAS: 0.8453, UEM: 0.4518, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4663, partial_loss/deprel_loss: 0.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7723, loss: 1.0488, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||: 3%|2 | 3/111 [00:02<01:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9059, LAS: 0.8377, UEM: 0.5846, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6475, partial_loss/deprel_loss: 0.8195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8574, loss: 1.0996, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||: 5%|5 | 6/111 [00:04<01:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9139, LAS: 0.8456, UEM: 0.5705, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6774, loss: 1.0076, batch_reg_loss: 0.0724, reg_loss: 0.0723 ||: 8%|8 | 9/111 [00:06<01:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9174, LAS: 0.8482, UEM: 0.5739, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3122, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6293, loss: 0.9715, batch_reg_loss: 0.0725, reg_loss: 0.0723 ||: 11%|# | 12/111 [00:08<01:13, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8221, UAS: 0.9104, LAS: 0.8398, UEM: 0.5355, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0309, partial_loss/deprel_loss: 1.0752, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.1389, loss: 1.0415, batch_reg_loss: 0.0725, reg_loss: 0.0724 ||: 14%|#3 | 15/111 [00:11<01:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9067, LAS: 0.8371, UEM: 0.5688, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8351, partial_loss/deprel_loss: 0.9804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0239, loss: 1.0859, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||: 16%|#6 | 18/111 [00:13<01:10, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9099, LAS: 0.8394, UEM: 0.5595, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5296, partial_loss/deprel_loss: 0.7868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8080, loss: 1.0573, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||: 19%|#8 | 21/111 [00:15<01:05, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9070, LAS: 0.8361, UEM: 0.5278, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5860, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8579, loss: 1.0872, batch_reg_loss: 0.0727, reg_loss: 0.0725 ||: 23%|##2 | 25/111 [00:17<00:59, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9108, LAS: 0.8402, UEM: 0.5494, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7324, partial_loss/deprel_loss: 0.9558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9839, loss: 1.0478, batch_reg_loss: 0.0728, reg_loss: 0.0725 ||: 25%|##5 | 28/111 [00:20<00:58, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8217, 
UAS: 0.9095, LAS: 0.8378, UEM: 0.5353, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9042, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1834, loss: 1.0668, batch_reg_loss: 0.0729, reg_loss: 0.0726 ||: 29%|##8 | 32/111 [00:22<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9101, LAS: 0.8382, UEM: 0.5166, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5087, partial_loss/deprel_loss: 0.8009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 1.0627, batch_reg_loss: 0.0730, reg_loss: 0.0726 ||: 32%|###2 | 36/111 [00:25<00:49, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9089, LAS: 0.8370, UEM: 0.5070, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3822, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4248, loss: 1.0717, batch_reg_loss: 0.0731, reg_loss: 0.0726 ||: 36%|###6 | 40/111 [00:27<00:46, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9101, LAS: 0.8384, UEM: 0.5297, LEM: 0.2952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2709, loss: 1.0596, batch_reg_loss: 0.0731, reg_loss: 0.0727 ||: 40%|###9 | 44/111 [00:30<00:47, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9088, LAS: 0.8368, UEM: 0.5236, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3538, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 
1.0727, batch_reg_loss: 0.0732, reg_loss: 0.0727 ||: 43%|####3 | 48/111 [00:33<00:44, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9072, LAS: 0.8350, UEM: 0.5092, LEM: 0.2833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 1.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3859, loss: 1.0896, batch_reg_loss: 0.0733, reg_loss: 0.0728 ||: 46%|####5 | 51/111 [00:36<00:43, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9088, LAS: 0.8370, UEM: 0.5143, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8776, partial_loss/deprel_loss: 1.0180, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0633, loss: 1.0735, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||: 49%|####8 | 54/111 [00:38<00:43, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7273, UAS: 0.9077, LAS: 0.8359, UEM: 0.5105, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6504, partial_loss/deprel_loss: 1.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0438, loss: 1.0829, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||: 51%|#####1 | 57/111 [00:40<00:39, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7544, UAS: 0.9065, LAS: 0.8341, UEM: 0.4990, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8573, partial_loss/deprel_loss: 1.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8378, loss: 1.0979, batch_reg_loss: 0.0735, reg_loss: 0.0729 ||: 54%|#####4 | 60/111 [00:42<00:37, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7376, UAS: 0.9049, LAS: 
0.8321, UEM: 0.4968, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1506, partial_loss/deprel_loss: 1.7339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8908, loss: 1.1161, batch_reg_loss: 0.0736, reg_loss: 0.0729 ||: 57%|#####6 | 63/111 [00:45<00:35, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7635, UAS: 0.9050, LAS: 0.8323, UEM: 0.4953, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9722, partial_loss/deprel_loss: 1.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7789, loss: 1.1152, batch_reg_loss: 0.0737, reg_loss: 0.0729 ||: 60%|###### | 67/111 [00:47<00:31, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9055, LAS: 0.8327, UEM: 0.4957, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5937, loss: 1.1123, batch_reg_loss: 0.0737, reg_loss: 0.0730 ||: 63%|######3 | 70/111 [00:50<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9058, LAS: 0.8332, UEM: 0.4880, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6342, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8317, loss: 1.1077, batch_reg_loss: 0.0738, reg_loss: 0.0730 ||: 67%|######6 | 74/111 [00:52<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9068, LAS: 0.8343, UEM: 0.4830, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7012, partial_loss/deprel_loss: 
0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9318, loss: 1.0977, batch_reg_loss: 0.0739, reg_loss: 0.0731 ||: 70%|####### | 78/111 [00:54<00:21, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9070, LAS: 0.8342, UEM: 0.4768, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7163, partial_loss/deprel_loss: 0.9517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9786, loss: 1.0981, batch_reg_loss: 0.0740, reg_loss: 0.0731 ||: 74%|#######3 | 82/111 [00:57<00:19, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.9056, LAS: 0.8328, UEM: 0.4687, LEM: 0.2366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1859, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8147, loss: 1.1102, batch_reg_loss: 0.0741, reg_loss: 0.0731 ||: 77%|#######7 | 86/111 [00:59<00:15, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9051, LAS: 0.8322, UEM: 0.4610, LEM: 0.2306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6899, partial_loss/deprel_loss: 0.8140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8633, loss: 1.1154, batch_reg_loss: 0.0742, reg_loss: 0.0732 ||: 81%|########1 | 90/111 [01:02<00:13, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9056, LAS: 0.8328, UEM: 0.4617, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.5813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6080, loss: 1.1113, batch_reg_loss: 0.0743, reg_loss: 0.0732 ||: 85%|########4 | 94/111 [01:04<00:10, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9058, LAS: 0.8330, UEM: 0.4594, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8808, partial_loss/deprel_loss: 1.0929, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1248, loss: 1.1101, batch_reg_loss: 0.0743, reg_loss: 0.0733 ||: 88%|########8 | 98/111 [01:07<00:08, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9059, LAS: 0.8333, UEM: 0.4644, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.6404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6920, loss: 1.1069, batch_reg_loss: 0.0744, reg_loss: 0.0733 ||: 92%|#########1| 102/111 [01:09<00:05, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9051, LAS: 0.8326, UEM: 0.4572, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.9381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 1.1119, batch_reg_loss: 0.0745, reg_loss: 0.0734 ||: 95%|#########5| 106/111 [01:12<00:03, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9062, LAS: 0.8339, UEM: 0.4675, LEM: 0.2349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0885, partial_loss/deprel_loss: 1.1797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0998, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||: 99%|#########9| 110/111 [01:15<00:00, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9061, LAS: 0.8338, UEM: 0.4655, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0232, 
partial_loss/deprel_loss: 1.1102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1674, loss: 1.1004, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:07:05,881 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.110 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.023 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - reg_loss | 0.073 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UEM | 0.465 | N/A\n", + "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - LAS | 0.834 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - loss | 1.100 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEM | 0.233 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - UAS | 0.906 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EM | 0.820 | N/A\n", + "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Epoch duration: 0:01:15.777801\n", + "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Estimated training time remaining: 8:35:17\n", + "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Epoch 13/399\n", + "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:07:05,891 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8619, UEM: 0.4574, LEM: 0.1618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7100, partial_loss/deprel_loss: 0.9025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9387, loss: 0.8542, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||: 4%|3 | 4/111 [00:02<01:05, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9274, LAS: 0.8577, UEM: 0.5495, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5867, partial_loss/deprel_loss: 0.8378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8624, loss: 0.9059, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||: 6%|6 | 
7/111 [00:04<01:06, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9324, LAS: 0.8661, UEM: 0.6490, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 0.9270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.8396, batch_reg_loss: 0.0748, reg_loss: 0.0747 ||: 9%|9 | 10/111 [00:07<01:10, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9237, LAS: 0.8552, UEM: 0.6107, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5861, partial_loss/deprel_loss: 0.8717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8895, loss: 0.9147, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||: 12%|#1 | 13/111 [00:09<01:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9197, LAS: 0.8506, UEM: 0.5745, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3641, partial_loss/deprel_loss: 0.6230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6461, loss: 0.9695, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||: 15%|#5 | 17/111 [00:11<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9151, LAS: 0.8442, UEM: 0.5264, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1686, partial_loss/deprel_loss: 1.2195, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2844, loss: 1.0252, batch_reg_loss: 0.0750, reg_loss: 0.0748 ||: 19%|#8 | 21/111 [00:13<00:57, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8267, UAS: 0.9124, LAS: 0.8413, UEM: 0.4941, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 1.0154, partial_loss/deprel_loss: 1.0660, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1310, loss: 1.0460, batch_reg_loss: 0.0751, reg_loss: 0.0749 ||: 23%|##2 | 25/111 [00:16<00:53, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8238, UAS: 0.9086, LAS: 0.8368, UEM: 0.4664, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0240, partial_loss/deprel_loss: 1.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2887, loss: 1.0848, batch_reg_loss: 0.0752, reg_loss: 0.0749 ||: 26%|##6 | 29/111 [00:18<00:49, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9055, LAS: 0.8337, UEM: 0.4621, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6710, loss: 1.1165, batch_reg_loss: 0.0753, reg_loss: 0.0749 ||: 30%|##9 | 33/111 [00:21<00:49, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9073, LAS: 0.8363, UEM: 0.4795, LEM: 0.2514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6131, partial_loss/deprel_loss: 0.7515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 1.0915, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||: 33%|###3 | 37/111 [00:24<00:49, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7761, UAS: 0.9057, LAS: 0.8346, UEM: 0.4668, LEM: 0.2435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8575, partial_loss/deprel_loss: 1.3668, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5404, loss: 1.1023, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||: 36%|###6 | 40/111 [00:26<00:49, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.9043, LAS: 0.8329, UEM: 0.4531, LEM: 0.2340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5114, partial_loss/deprel_loss: 1.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5020, loss: 1.1203, batch_reg_loss: 0.0755, reg_loss: 0.0751 ||: 40%|###9 | 44/111 [00:29<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9052, LAS: 0.8341, UEM: 0.4580, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0554, loss: 1.1106, batch_reg_loss: 0.0756, reg_loss: 0.0751 ||: 43%|####3 | 48/111 [00:31<00:41, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9044, LAS: 0.8330, UEM: 0.4435, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.9511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 1.1189, batch_reg_loss: 0.0757, reg_loss: 0.0752 ||: 47%|####6 | 52/111 [00:34<00:38, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8000, UAS: 0.9029, LAS: 0.8312, UEM: 0.4362, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5169, partial_loss/deprel_loss: 1.3667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4725, loss: 1.1357, batch_reg_loss: 0.0758, reg_loss: 0.0752 ||: 50%|##### | 56/111 [00:36<00:36, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7002, UAS: 0.9022, LAS: 0.8304, UEM: 0.4436, LEM: 0.2236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 3.2238, partial_loss/deprel_loss: 2.1219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4182, loss: 1.1438, batch_reg_loss: 0.0759, reg_loss: 0.0752 ||: 54%|#####4 | 60/111 [00:39<00:33, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9040, LAS: 0.8323, UEM: 0.4516, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6981, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9721, loss: 1.1264, batch_reg_loss: 0.0760, reg_loss: 0.0753 ||: 58%|#####7 | 64/111 [00:41<00:30, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9055, LAS: 0.8341, UEM: 0.4556, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4415, partial_loss/deprel_loss: 0.7414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 1.1101, batch_reg_loss: 0.0761, reg_loss: 0.0753 ||: 61%|######1 | 68/111 [00:44<00:28, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9040, LAS: 0.8328, UEM: 0.4447, LEM: 0.2207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7093, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8168, loss: 1.1185, batch_reg_loss: 0.0762, reg_loss: 0.0754 ||: 65%|######4 | 72/111 [00:47<00:25, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9043, LAS: 0.8333, UEM: 0.4447, LEM: 0.2198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2306, partial_loss/deprel_loss: 1.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2224, loss: 1.1130, batch_reg_loss: 
0.0763, reg_loss: 0.0754 ||: 68%|######8 | 76/111 [00:50<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9062, LAS: 0.8355, UEM: 0.4584, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2390, partial_loss/deprel_loss: 0.4781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 1.0937, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||: 72%|#######2 | 80/111 [00:53<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8032, UAS: 0.9060, LAS: 0.8351, UEM: 0.4538, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3960, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4506, loss: 1.0980, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||: 75%|#######4 | 83/111 [00:55<00:19, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9050, LAS: 0.8337, UEM: 0.4466, LEM: 0.2208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3930, partial_loss/deprel_loss: 1.3680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4495, loss: 1.1114, batch_reg_loss: 0.0765, reg_loss: 0.0755 ||: 77%|#######7 | 86/111 [00:57<00:17, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9049, LAS: 0.8336, UEM: 0.4501, LEM: 0.2231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3639, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6060, loss: 1.1125, batch_reg_loss: 0.0765, reg_loss: 0.0756 ||: 80%|######## | 89/111 [00:59<00:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9055, LAS: 0.8343, UEM: 
0.4625, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.6558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 1.1064, batch_reg_loss: 0.0766, reg_loss: 0.0756 ||: 84%|########3 | 93/111 [01:02<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9057, LAS: 0.8346, UEM: 0.4606, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0815, partial_loss/deprel_loss: 1.1541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2163, loss: 1.1032, batch_reg_loss: 0.0767, reg_loss: 0.0757 ||: 87%|########7 | 97/111 [01:04<00:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9064, LAS: 0.8353, UEM: 0.4631, LEM: 0.2353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5644, partial_loss/deprel_loss: 0.7545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 1.0944, batch_reg_loss: 0.0768, reg_loss: 0.0757 ||: 90%|######### | 100/111 [01:07<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9071, LAS: 0.8359, UEM: 0.4619, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4491, partial_loss/deprel_loss: 0.7446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 1.0887, batch_reg_loss: 0.0769, reg_loss: 0.0757 ||: 94%|#########3| 104/111 [01:09<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9075, LAS: 0.8365, UEM: 0.4599, LEM: 0.2282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.9821, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 1.0846, 
batch_reg_loss: 0.0770, reg_loss: 0.0758 ||: 97%|#########7| 108/111 [01:12<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9079, LAS: 0.8370, UEM: 0.4689, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.6604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.0791, batch_reg_loss: 0.0770, reg_loss: 0.0758 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.660 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.501 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - reg_loss | 0.076 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UEM | 0.469 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LAS | 0.837 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - 
combo.training.tensorboard_writer - loss | 1.079 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEM | 0.236 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - UAS | 0.908 | N/A\n", + "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - EM | 0.877 | N/A\n", + "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:08:20,321 - INFO - combo.training.trainer - Epoch duration: 0:01:14.437484\n", + "2023-04-06 23:08:20,322 - INFO - combo.training.trainer - Estimated training time remaining: 8:31:27\n", + "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Epoch 14/399\n", + "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:08:20,328 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9050, LAS: 0.8322, UEM: 0.3462, LEM: 0.1412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 1.1053, batch_reg_loss: 0.0771, reg_loss: 0.0771 ||: 4%|3 | 4/111 [00:02<01:09, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9247, LAS: 0.8550, UEM: 0.5441, LEM: 0.2661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2521, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.9122, batch_reg_loss: 0.0772, reg_loss: 0.0771 ||: 6%|6 | 7/111 [00:04<01:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9159, LAS: 0.8477, UEM: 0.6024, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8878, partial_loss/deprel_loss: 0.9722, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0326, loss: 0.9816, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||: 9%|9 | 10/111 [00:06<01:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9164, LAS: 0.8477, UEM: 0.5390, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8523, partial_loss/deprel_loss: 0.9885, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0386, loss: 0.9758, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||: 13%|#2 | 14/111 [00:09<01:03, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9110, LAS: 0.8412, UEM: 0.5185, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9668, partial_loss/deprel_loss: 1.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6841, loss: 1.0342, batch_reg_loss: 0.0774, reg_loss: 0.0772 ||: 15%|#5 | 17/111 [00:11<01:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9141, LAS: 0.8444, UEM: 0.5072, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6296, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 1.0093, batch_reg_loss: 0.0775, reg_loss: 0.0773 ||: 19%|#8 | 21/111 [00:14<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9116, LAS: 0.8416, UEM: 0.4865, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0877, partial_loss/deprel_loss: 1.1095, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1827, loss: 1.0410, batch_reg_loss: 0.0776, reg_loss: 0.0773 ||: 23%|##2 | 25/111 [00:16<00:57, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9061, LAS: 0.8356, UEM: 0.4625, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.8587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9058, loss: 1.0970, batch_reg_loss: 0.0777, reg_loss: 0.0774 ||: 26%|##6 | 29/111 [00:19<00:52, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9051, LAS: 0.8340, UEM: 0.4469, LEM: 0.2211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0395, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1441, loss: 1.1120, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||: 30%|##9 | 33/111 [00:21<00:50, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9085, LAS: 0.8382, UEM: 0.4764, LEM: 0.2406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.6205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 1.0744, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||: 32%|###2 | 36/111 [00:24<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9108, LAS: 0.8411, UEM: 0.4902, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6145, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 1.0500, batch_reg_loss: 0.0779, reg_loss: 0.0775 ||: 36%|###6 | 40/111 [00:26<00:48, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9124, LAS: 0.8426, UEM: 0.4984, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3140, partial_loss/deprel_loss: 0.5344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5684, loss: 1.0315, batch_reg_loss: 0.0780, reg_loss: 0.0775 ||: 40%|###9 | 44/111 [00:29<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9119, LAS: 0.8419, UEM: 0.4840, LEM: 0.2437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9631, partial_loss/deprel_loss: 1.0249, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0907, loss: 1.0371, batch_reg_loss: 0.0781, reg_loss: 0.0776 ||: 42%|####2 | 47/111 [00:31<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9133, LAS: 0.8437, UEM: 0.4948, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4537, loss: 1.0207, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||: 46%|####5 | 51/111 [00:34<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7901, UAS: 0.9129, LAS: 0.8434, UEM: 0.4891, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6952, partial_loss/deprel_loss: 1.4274, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.5592, loss: 1.0256, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||: 49%|####8 | 54/111 [00:36<00:40, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9121, LAS: 0.8425, UEM: 0.4933, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 1.0326, batch_reg_loss: 0.0783, reg_loss: 0.0777 ||: 52%|#####2 | 58/111 [00:39<00:37, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9113, LAS: 0.8415, UEM: 0.4846, LEM: 0.2433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6334, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9019, loss: 1.0366, batch_reg_loss: 0.0784, reg_loss: 0.0777 ||: 56%|#####5 | 62/111 [00:41<00:33, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9111, LAS: 0.8413, UEM: 0.4800, LEM: 0.2409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 1.0415, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||: 59%|#####8 | 65/111 [00:44<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7980, UAS: 0.9108, LAS: 0.8410, UEM: 0.4735, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4804, partial_loss/deprel_loss: 1.3567, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4600, loss: 1.0455, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||: 61%|######1 | 68/111 [00:46<00:30, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.7880, UAS: 0.9112, LAS: 0.8414, UEM: 0.4779, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6517, partial_loss/deprel_loss: 1.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5415, loss: 1.0425, batch_reg_loss: 0.0786, reg_loss: 0.0778 ||: 64%|######3 | 71/111 [00:48<00:29, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9119, LAS: 0.8426, UEM: 0.4984, LEM: 0.2679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2941, loss: 1.0349, batch_reg_loss: 0.0786, reg_loss: 0.0779 ||: 67%|######6 | 74/111 [00:50<00:27, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7983, UAS: 0.9113, LAS: 0.8419, UEM: 0.4900, LEM: 0.2614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4769, partial_loss/deprel_loss: 1.3341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4414, loss: 1.0420, batch_reg_loss: 0.0787, reg_loss: 0.0779 ||: 70%|####### | 78/111 [00:53<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.9108, LAS: 0.8416, UEM: 0.4961, LEM: 0.2649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2212, partial_loss/deprel_loss: 2.0886, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3939, loss: 1.0457, batch_reg_loss: 0.0788, reg_loss: 0.0779 ||: 74%|#######3 | 82/111 [00:56<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9102, LAS: 0.8409, UEM: 0.4893, LEM: 0.2593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6706, partial_loss/deprel_loss: 0.8114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8622, loss: 1.0496, batch_reg_loss: 0.0789, reg_loss: 0.0780 ||: 77%|#######7 | 86/111 [00:58<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9103, LAS: 0.8411, UEM: 0.4857, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4870, partial_loss/deprel_loss: 1.3774, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4783, loss: 1.0499, batch_reg_loss: 0.0790, reg_loss: 0.0780 ||: 81%|########1 | 90/111 [01:01<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9096, LAS: 0.8401, UEM: 0.4780, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9445, loss: 1.0577, batch_reg_loss: 0.0791, reg_loss: 0.0781 ||: 85%|########4 | 94/111 [01:03<00:10, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9107, LAS: 0.8414, UEM: 0.4827, LEM: 0.2505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6406, partial_loss/deprel_loss: 0.8061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 1.0448, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||: 88%|########8 | 98/111 [01:06<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8037, UAS: 0.9103, LAS: 0.8410, UEM: 0.4798, LEM: 0.2484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2133, partial_loss/deprel_loss: 1.2041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.0474, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||: 91%|######### | 101/111 [01:08<00:07, 1.43it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9088, LAS: 0.8395, UEM: 0.4738, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0699, partial_loss/deprel_loss: 1.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7770, loss: 1.0608, batch_reg_loss: 0.0793, reg_loss: 0.0782 ||: 94%|#########3| 104/111 [01:11<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8128, UAS: 0.9079, LAS: 0.8384, UEM: 0.4676, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1866, partial_loss/deprel_loss: 1.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3208, loss: 1.0707, batch_reg_loss: 0.0794, reg_loss: 0.0782 ||: 96%|#########6| 107/111 [01:13<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 
23:09:36,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.627 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.394 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - reg_loss | 0.078 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UEM | 0.474 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - LAS | 0.840 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - loss | 1.059 | N/A\n", + "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEM | 0.244 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - UAS | 0.909 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EM | 0.879 | N/A\n", + "2023-04-06 
23:09:36,177 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Epoch duration: 0:01:15.855623\n", + "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Estimated training time remaining: 8:28:34\n", + "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Epoch 15/399\n", + "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:09:36,183 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9129, LAS: 0.8471, UEM: 0.5121, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.5037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5505, loss: 1.0156, batch_reg_loss: 0.0795, reg_loss: 0.0795 ||: 3%|2 | 3/111 [00:02<01:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9213, LAS: 0.8539, UEM: 0.5395, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6728, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8665, loss: 0.9328, batch_reg_loss: 0.0796, reg_loss: 0.0796 ||: 6%|6 | 7/111 [00:04<01:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9119, LAS: 0.8434, UEM: 0.4963, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8418, loss: 1.0238, batch_reg_loss: 
0.0797, reg_loss: 0.0796 ||: 9%|9 | 10/111 [00:06<01:08, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9158, LAS: 0.8482, UEM: 0.4947, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4600, partial_loss/deprel_loss: 0.6518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6932, loss: 0.9811, batch_reg_loss: 0.0798, reg_loss: 0.0796 ||: 13%|#2 | 14/111 [00:09<01:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9126, LAS: 0.8430, UEM: 0.4992, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 1.0350, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||: 16%|#6 | 18/111 [00:11<01:01, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9172, LAS: 0.8487, UEM: 0.5242, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3962, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.9883, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||: 19%|#8 | 21/111 [00:14<01:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9172, LAS: 0.8486, UEM: 0.5373, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4394, partial_loss/deprel_loss: 0.6408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6805, loss: 0.9807, batch_reg_loss: 0.0800, reg_loss: 0.0797 ||: 22%|##1 | 24/111 [00:16<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9188, LAS: 0.8518, UEM: 0.5242, LEM: 0.2712, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.6435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.9584, batch_reg_loss: 0.0801, reg_loss: 0.0798 ||: 25%|##5 | 28/111 [00:19<00:58, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9203, LAS: 0.8540, UEM: 0.5249, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5017, loss: 0.9409, batch_reg_loss: 0.0802, reg_loss: 0.0798 ||: 29%|##8 | 32/111 [00:21<00:54, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9190, LAS: 0.8522, UEM: 0.5190, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3828, partial_loss/deprel_loss: 1.3768, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4582, loss: 0.9604, batch_reg_loss: 0.0802, reg_loss: 0.0799 ||: 32%|###1 | 35/111 [00:23<00:52, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7389, UAS: 0.9176, LAS: 0.8506, UEM: 0.5181, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2919, partial_loss/deprel_loss: 1.6833, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8853, loss: 0.9725, batch_reg_loss: 0.0803, reg_loss: 0.0799 ||: 34%|###4 | 38/111 [00:26<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9187, LAS: 0.8517, UEM: 0.5193, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3254, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9599, batch_reg_loss: 0.0804, reg_loss: 0.0799 ||: 37%|###6 
| 41/111 [00:28<00:50, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9194, LAS: 0.8522, UEM: 0.5159, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.9546, batch_reg_loss: 0.0804, reg_loss: 0.0800 ||: 40%|###9 | 44/111 [00:30<00:47, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9198, LAS: 0.8526, UEM: 0.5182, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4518, partial_loss/deprel_loss: 0.7032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.9497, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||: 42%|####2 | 47/111 [00:32<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9207, LAS: 0.8539, UEM: 0.5335, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1517, partial_loss/deprel_loss: 0.3182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.9379, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||: 45%|####5 | 50/111 [00:34<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9215, LAS: 0.8548, UEM: 0.5430, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 1.0522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1027, loss: 0.9278, batch_reg_loss: 0.0806, reg_loss: 0.0801 ||: 48%|####7 | 53/111 [00:37<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9200, LAS: 0.8530, UEM: 0.5317, LEM: 0.2759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.8304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.9473, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9206, LAS: 0.8537, UEM: 0.5313, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5806, loss: 0.9414, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9210, LAS: 0.8541, UEM: 0.5338, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9455, partial_loss/deprel_loss: 1.0358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0985, loss: 0.9351, batch_reg_loss: 0.0808, reg_loss: 0.0802 ||: 57%|#####6 | 63/111 [00:43<00:34, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7807, UAS: 0.9184, LAS: 0.8511, UEM: 0.5201, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6969, partial_loss/deprel_loss: 1.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5876, loss: 0.9608, batch_reg_loss: 0.0809, reg_loss: 0.0802 ||: 60%|###### | 67/111 [00:46<00:30, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7824, UAS: 0.9154, LAS: 0.8479, UEM: 0.5090, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7713, partial_loss/deprel_loss: 1.3922, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5490, loss: 0.9869, 
batch_reg_loss: 0.0810, reg_loss: 0.0802 ||: 64%|######3 | 71/111 [00:49<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9155, LAS: 0.8480, UEM: 0.5164, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1790, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4386, loss: 0.9870, batch_reg_loss: 0.0811, reg_loss: 0.0803 ||: 68%|######7 | 75/111 [00:51<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9141, LAS: 0.8463, UEM: 0.5077, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6719, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 1.0058, batch_reg_loss: 0.0812, reg_loss: 0.0803 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7749, UAS: 0.9124, LAS: 0.8444, UEM: 0.4999, LEM: 0.2572, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7582, partial_loss/deprel_loss: 1.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5744, loss: 1.0213, batch_reg_loss: 0.0812, reg_loss: 0.0804 ||: 74%|#######3 | 82/111 [00:56<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9121, LAS: 0.8439, UEM: 0.4934, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.7789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8214, loss: 1.0266, batch_reg_loss: 0.0813, reg_loss: 0.0804 ||: 77%|#######6 | 85/111 [00:58<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9122, LAS: 
0.8440, UEM: 0.4887, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7833, partial_loss/deprel_loss: 1.0462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0750, loss: 1.0278, batch_reg_loss: 0.0814, reg_loss: 0.0804 ||: 80%|######## | 89/111 [01:01<00:14, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9112, LAS: 0.8429, UEM: 0.4808, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5965, partial_loss/deprel_loss: 0.7940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0355, batch_reg_loss: 0.0815, reg_loss: 0.0805 ||: 84%|########3 | 93/111 [01:03<00:11, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9112, LAS: 0.8426, UEM: 0.4752, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4334, loss: 1.0376, batch_reg_loss: 0.0816, reg_loss: 0.0805 ||: 87%|########7 | 97/111 [01:05<00:08, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9109, LAS: 0.8420, UEM: 0.4715, LEM: 0.2341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6782, partial_loss/deprel_loss: 0.8343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 1.0429, batch_reg_loss: 0.0817, reg_loss: 0.0806 ||: 91%|######### | 101/111 [01:08<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9114, LAS: 0.8427, UEM: 0.4907, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8753, partial_loss/deprel_loss: 1.6942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8122, loss: 
1.0390, batch_reg_loss: 0.0818, reg_loss: 0.0806 ||: 95%|#########4| 105/111 [01:11<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9112, LAS: 0.8426, UEM: 0.4832, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.2117, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3270, loss: 1.0401, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||: 98%|#########8| 109/111 [01:14<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9112, LAS: 0.8424, UEM: 0.4790, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8623, partial_loss/deprel_loss: 1.0124, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 1.0407, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:10:51,901 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9633, LAS: 0.9155, UEM: 0.8426, LEM: 0.6012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2034, partial_loss/deprel_loss: 20.0996, partial_loss/cycle_loss: 0.0000, batch_loss: 16.1204, loss: 18.3759, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8487, UAS: 0.9482, LAS: 0.8943, UEM: 0.7481, LEM: 0.4864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1447, partial_loss/deprel_loss: 48.1773, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7708, loss: 23.6897, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 31%|### | 4/13 [00:04<00:09, 1.04s/it]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9460, LAS: 0.8896, UEM: 0.6815, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5206, partial_loss/deprel_loss: 23.6872, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0539, loss: 21.7025, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:06<00:05, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9392, LAS: 0.8802, UEM: 0.6161, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0001, partial_loss/deprel_loss: 36.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 29.2929, loss: 24.2677, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:09<00:02, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9333, LAS: 0.8731, UEM: 0.5785, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 29.1962, partial_loss/cycle_loss: 0.0000, batch_loss: 23.5160, loss: 26.0322, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:01, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9363, LAS: 0.8771, UEM: 0.6121, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 23.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 18.4698, loss: 25.4504, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 
23:11:04,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.012 | 23.031\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.862 | 0.224\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - reg_loss | 0.081 | 0.000\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UEM | 0.479 | 0.612\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LAS | 0.842 | 0.877\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - loss | 1.041 | 25.450\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEM | 0.247 | 0.344\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UAS | 0.911 | 0.936\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - 
EM | 0.839 | 0.925\n", + "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Epoch duration: 0:01:28.335274\n", + "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Estimated training time remaining: 8:30:52\n", + "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Epoch 16/399\n", + "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:11:04,519 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7589, UAS: 0.9080, LAS: 0.8432, UEM: 0.5846, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2122, partial_loss/deprel_loss: 1.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7785, loss: 1.0280, batch_reg_loss: 0.0820, reg_loss: 0.0820 ||: 3%|2 | 3/111 [00:02<01:22, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9242, LAS: 0.8615, UEM: 0.5455, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6915, partial_loss/deprel_loss: 0.7745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8400, loss: 0.8831, batch_reg_loss: 0.0821, reg_loss: 0.0820 ||: 6%|6 | 7/111 [00:04<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9154, LAS: 0.8499, UEM: 0.4670, LEM: 0.2081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9397, partial_loss/deprel_loss: 1.1732, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.2086, loss: 1.0023, batch_reg_loss: 0.0822, reg_loss: 0.0821 ||: 9%|9 | 10/111 [00:06<01:12, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8657, UAS: 0.9175, LAS: 0.8510, UEM: 0.4862, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5694, partial_loss/deprel_loss: 0.7629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8065, loss: 0.9746, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||: 13%|#2 | 14/111 [00:09<01:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9107, LAS: 0.8442, UEM: 0.4501, LEM: 0.1969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7070, partial_loss/deprel_loss: 0.7876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8538, loss: 1.0366, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||: 16%|#6 | 18/111 [00:11<01:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9177, LAS: 0.8516, UEM: 0.5343, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5199, loss: 0.9668, batch_reg_loss: 0.0824, reg_loss: 0.0822 ||: 20%|#9 | 22/111 [00:14<00:58, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9192, LAS: 0.8529, UEM: 0.5322, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6265, loss: 0.9500, batch_reg_loss: 0.0825, reg_loss: 0.0822 ||: 23%|##2 | 25/111 [00:16<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9144, LAS: 
0.8473, UEM: 0.5001, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9402, partial_loss/deprel_loss: 1.0992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1499, loss: 1.0039, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||: 26%|##6 | 29/111 [00:19<00:54, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9124, LAS: 0.8448, UEM: 0.4943, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6395, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8791, loss: 1.0205, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||: 30%|##9 | 33/111 [00:21<00:50, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9116, LAS: 0.8445, UEM: 0.4757, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1420, partial_loss/deprel_loss: 1.1341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2184, loss: 1.0229, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||: 32%|###2 | 36/111 [00:23<00:49, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9109, LAS: 0.8433, UEM: 0.4713, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.6151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 1.0294, batch_reg_loss: 0.0828, reg_loss: 0.0824 ||: 36%|###6 | 40/111 [00:26<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9110, LAS: 0.8432, UEM: 0.4799, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.8820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9484, loss: 1.0291, 
batch_reg_loss: 0.0829, reg_loss: 0.0824 ||: 39%|###8 | 43/111 [00:28<00:47, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7958, UAS: 0.9110, LAS: 0.8432, UEM: 0.4756, LEM: 0.2299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3631, partial_loss/deprel_loss: 1.3073, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4014, loss: 1.0309, batch_reg_loss: 0.0829, reg_loss: 0.0825 ||: 41%|####1 | 46/111 [00:30<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9128, LAS: 0.8450, UEM: 0.4773, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.9011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9440, loss: 1.0167, batch_reg_loss: 0.0830, reg_loss: 0.0825 ||: 44%|####4 | 49/111 [00:33<00:44, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9116, LAS: 0.8436, UEM: 0.4651, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6289, partial_loss/deprel_loss: 0.8555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8933, loss: 1.0315, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||: 48%|####7 | 53/111 [00:35<00:39, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.9112, LAS: 0.8430, UEM: 0.4520, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 1.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3202, loss: 1.0350, batch_reg_loss: 0.0832, reg_loss: 0.0826 ||: 51%|#####1 | 57/111 [00:38<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9118, LAS: 0.8436, UEM: 
0.4508, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.6971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 1.0315, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||: 55%|#####4 | 61/111 [00:40<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9122, LAS: 0.8440, UEM: 0.4514, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0268, partial_loss/deprel_loss: 1.1379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1990, loss: 1.0293, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||: 58%|#####7 | 64/111 [00:43<00:32, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9126, LAS: 0.8445, UEM: 0.4557, LEM: 0.2132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3577, partial_loss/deprel_loss: 0.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5768, loss: 1.0256, batch_reg_loss: 0.0834, reg_loss: 0.0827 ||: 61%|######1 | 68/111 [00:45<00:29, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9138, LAS: 0.8459, UEM: 0.4563, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6427, partial_loss/deprel_loss: 0.9296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9557, loss: 1.0155, batch_reg_loss: 0.0835, reg_loss: 0.0827 ||: 65%|######4 | 72/111 [00:48<00:26, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9128, LAS: 0.8448, UEM: 0.4481, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9213, partial_loss/deprel_loss: 0.9996, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0676, loss: 1.0238, batch_reg_loss: 0.0836, reg_loss: 0.0828 ||: 68%|######8 | 76/111 [00:50<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9138, LAS: 0.8463, UEM: 0.4699, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3683, loss: 1.0118, batch_reg_loss: 0.0837, reg_loss: 0.0828 ||: 72%|#######2 | 80/111 [00:53<00:20, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7485, UAS: 0.9127, LAS: 0.8450, UEM: 0.4712, LEM: 0.2295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4496, partial_loss/deprel_loss: 1.8294, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0372, loss: 1.0233, batch_reg_loss: 0.0838, reg_loss: 0.0829 ||: 76%|#######5 | 84/111 [00:56<00:17, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9140, LAS: 0.8467, UEM: 0.4935, LEM: 0.2568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.2183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2751, loss: 1.0081, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||: 79%|#######9 | 88/111 [00:59<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9135, LAS: 0.8460, UEM: 0.4869, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4877, partial_loss/deprel_loss: 0.7291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 1.0140, batch_reg_loss: 0.0840, reg_loss: 0.0830 ||: 83%|########2 | 92/111 [01:01<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9137, LAS: 0.8462, UEM: 0.4900, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0775, partial_loss/deprel_loss: 1.0943, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1750, loss: 1.0106, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||: 86%|########6 | 96/111 [01:04<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9119, LAS: 0.8443, UEM: 0.4847, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0740, partial_loss/deprel_loss: 1.0761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1598, loss: 1.0296, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||: 89%|########9 | 99/111 [01:07<00:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, UAS: 0.9125, LAS: 0.8451, UEM: 0.4915, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1448, loss: 1.0224, batch_reg_loss: 0.0842, reg_loss: 0.0831 ||: 92%|#########1| 102/111 [01:09<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9125, LAS: 0.8449, UEM: 0.4885, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4391, partial_loss/deprel_loss: 0.6192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6675, loss: 1.0221, batch_reg_loss: 0.0843, reg_loss: 0.0831 ||: 95%|#########4| 105/111 [01:11<00:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9127, LAS: 0.8451, UEM: 0.4833, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6720, 
partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8609, loss: 1.0200, batch_reg_loss: 0.0844, reg_loss: 0.0831 ||: 98%|#########8| 109/111 [01:13<00:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9127, LAS: 0.8451, UEM: 0.4802, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.8870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9131, loss: 1.0210, batch_reg_loss: 0.0844, reg_loss: 0.0832 ||: 100%|##########| 111/111 [01:14<00:00, 1.48it/s]\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.887 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.595 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - reg_loss | 0.083 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UEM | 0.480 | N/A\n", + "2023-04-06 23:12:19,452 - INFO - 
combo.training.tensorboard_writer - LAS | 0.845 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - loss | 1.021 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEM | 0.246 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - UAS | 0.913 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EM | 0.864 | N/A\n", + "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Epoch duration: 0:01:14.940605\n", + "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Estimated training time remaining: 8:27:43\n", + "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Epoch 17/399\n", + "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:12:19,461 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9216, LAS: 0.8554, UEM: 0.3382, LEM: 0.1011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5816, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.9648, batch_reg_loss: 0.0845, reg_loss: 0.0845 
||: 4%|3 | 4/111 [00:02<01:04, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9265, LAS: 0.8618, UEM: 0.3934, LEM: 0.1398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8730, loss: 0.8968, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||: 6%|6 | 7/111 [00:04<01:08, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9162, LAS: 0.8500, UEM: 0.3532, LEM: 0.1257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0305, partial_loss/deprel_loss: 0.9789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0739, loss: 0.9920, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||: 9%|9 | 10/111 [00:06<01:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8026, UAS: 0.9184, LAS: 0.8528, UEM: 0.4350, LEM: 0.1899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3660, partial_loss/deprel_loss: 1.2370, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3475, loss: 0.9582, batch_reg_loss: 0.0847, reg_loss: 0.0846 ||: 12%|#1 | 13/111 [00:08<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9205, LAS: 0.8554, UEM: 0.4904, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4147, partial_loss/deprel_loss: 0.5218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.9331, batch_reg_loss: 0.0848, reg_loss: 0.0846 ||: 15%|#5 | 17/111 [00:11<01:02, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9219, LAS: 0.8575, UEM: 0.5308, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.1652, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4877, loss: 0.9235, batch_reg_loss: 0.0849, reg_loss: 0.0846 ||: 18%|#8 | 20/111 [00:13<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8204, UAS: 0.9207, LAS: 0.8556, UEM: 0.5155, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1489, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2139, loss: 0.9339, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||: 22%|##1 | 24/111 [00:16<00:57, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9208, LAS: 0.8555, UEM: 0.4917, LEM: 0.2469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7885, partial_loss/deprel_loss: 0.9084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.9335, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||: 25%|##5 | 28/111 [00:18<00:52, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9203, LAS: 0.8549, UEM: 0.4892, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2998, partial_loss/deprel_loss: 0.5312, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.9418, batch_reg_loss: 0.0851, reg_loss: 0.0848 ||: 28%|##7 | 31/111 [00:20<00:53, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8699, UAS: 0.9203, LAS: 0.8548, UEM: 0.4730, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5786, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.9400, batch_reg_loss: 0.0852, reg_loss: 0.0848 ||: 32%|###1 | 35/111 [00:23<00:50, 1.51it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9223, LAS: 0.8573, UEM: 0.4940, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.9204, batch_reg_loss: 0.0853, reg_loss: 0.0849 ||: 34%|###4 | 38/111 [00:25<00:50, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9217, LAS: 0.8563, UEM: 0.4839, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5008, partial_loss/deprel_loss: 0.7724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8034, loss: 0.9291, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||: 38%|###7 | 42/111 [00:27<00:45, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9206, LAS: 0.8548, UEM: 0.4822, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 0.9410, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||: 41%|#### | 45/111 [00:30<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9174, LAS: 0.8517, UEM: 0.4643, LEM: 0.2239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0294, loss: 0.9654, batch_reg_loss: 0.0855, reg_loss: 0.0850 ||: 44%|####4 | 49/111 [00:32<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9165, LAS: 0.8508, UEM: 0.4653, LEM: 0.2219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.8402, partial_loss/deprel_loss: 0.8455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9301, loss: 0.9775, batch_reg_loss: 0.0856, reg_loss: 0.0850 ||: 48%|####7 | 53/111 [00:35<00:38, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9179, LAS: 0.8524, UEM: 0.4743, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8424, partial_loss/deprel_loss: 0.9273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.9632, batch_reg_loss: 0.0857, reg_loss: 0.0851 ||: 51%|#####1 | 57/111 [00:37<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9181, LAS: 0.8528, UEM: 0.4839, LEM: 0.2345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.9589, batch_reg_loss: 0.0858, reg_loss: 0.0851 ||: 55%|#####4 | 61/111 [00:40<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9201, LAS: 0.8551, UEM: 0.5090, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4550, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7183, loss: 0.9397, batch_reg_loss: 0.0859, reg_loss: 0.0852 ||: 59%|#####8 | 65/111 [00:43<00:30, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9196, LAS: 0.8545, UEM: 0.5017, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6634, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8311, loss: 0.9431, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||: 62%|######2 | 69/111 [00:46<00:28, 1.48it/s]\n" + 
] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9189, LAS: 0.8537, UEM: 0.4995, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4002, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.9510, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||: 65%|######4 | 72/111 [00:48<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9195, LAS: 0.8542, UEM: 0.5001, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.9440, batch_reg_loss: 0.0861, reg_loss: 0.0853 ||: 68%|######8 | 76/111 [00:50<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9161, LAS: 0.8505, UEM: 0.4923, LEM: 0.2467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8969, loss: 0.9753, batch_reg_loss: 0.0862, reg_loss: 0.0853 ||: 72%|#######2 | 80/111 [00:53<00:20, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8143, UAS: 0.9160, LAS: 0.8504, UEM: 0.4899, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3190, partial_loss/deprel_loss: 1.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3258, loss: 0.9778, batch_reg_loss: 0.0863, reg_loss: 0.0854 ||: 76%|#######5 | 84/111 [00:55<00:17, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7646, UAS: 0.9146, LAS: 0.8487, UEM: 0.4840, 
LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9803, partial_loss/deprel_loss: 1.4948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6783, loss: 0.9919, batch_reg_loss: 0.0864, reg_loss: 0.0854 ||: 79%|#######9 | 88/111 [00:57<00:14, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9150, LAS: 0.8493, UEM: 0.5098, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0973, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2956, loss: 0.9903, batch_reg_loss: 0.0865, reg_loss: 0.0855 ||: 83%|########2 | 92/111 [01:01<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9145, LAS: 0.8486, UEM: 0.5008, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1653, partial_loss/deprel_loss: 1.1575, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2456, loss: 0.9977, batch_reg_loss: 0.0866, reg_loss: 0.0855 ||: 86%|########6 | 96/111 [01:05<00:11, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8094, UAS: 0.9144, LAS: 0.8484, UEM: 0.4967, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3131, partial_loss/deprel_loss: 1.1735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2881, loss: 0.9981, batch_reg_loss: 0.0867, reg_loss: 0.0855 ||: 89%|########9 | 99/111 [01:07<00:09, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8428, UAS: 0.9144, LAS: 0.8483, UEM: 0.4979, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8804, partial_loss/deprel_loss: 1.0840, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1300, loss: 0.9994, 
batch_reg_loss: 0.0867, reg_loss: 0.0856 ||: 92%|#########1| 102/111 [01:09<00:06, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9148, LAS: 0.8489, UEM: 0.4973, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4124, partial_loss/deprel_loss: 0.5711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6262, loss: 0.9941, batch_reg_loss: 0.0868, reg_loss: 0.0856 ||: 95%|#########4| 105/111 [01:12<00:04, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9151, LAS: 0.8490, UEM: 0.4923, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8749, loss: 0.9937, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||: 98%|#########8| 109/111 [01:14<00:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8040, UAS: 0.9140, LAS: 0.8479, UEM: 0.4885, LEM: 0.2549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3149, partial_loss/deprel_loss: 1.1623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2798, loss: 1.0035, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:13:34,894 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.162 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.315 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - reg_loss | 0.086 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UEM | 0.489 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - LAS | 0.848 | N/A\n", + "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - loss | 1.004 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEM | 0.255 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - UAS | 0.914 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EM | 0.804 | N/A\n", + "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Epoch duration: 0:01:15.442752\n", + "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Estimated training time remaining: 8:24:56\n", + "2023-04-06 23:13:34,897 - INFO 
- allennlp.training.trainer - Epoch 18/399\n", + "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:13:34,904 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8228, UAS: 0.9169, LAS: 0.8505, UEM: 0.3212, LEM: 0.0933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 1.1094, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1928, loss: 0.9545, batch_reg_loss: 0.0870, reg_loss: 0.0870 ||: 3%|2 | 3/111 [00:02<01:20, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9276, LAS: 0.8623, UEM: 0.5231, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.5087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5591, loss: 0.8390, batch_reg_loss: 0.0871, reg_loss: 0.0870 ||: 5%|5 | 6/111 [00:04<01:20, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9346, LAS: 0.8740, UEM: 0.6711, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1051, partial_loss/deprel_loss: 0.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2839, loss: 0.7732, batch_reg_loss: 0.0872, reg_loss: 0.0871 ||: 9%|9 | 10/111 [00:07<01:17, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9301, LAS: 0.8680, UEM: 0.6054, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6862, 
partial_loss/deprel_loss: 0.8887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9355, loss: 0.8377, batch_reg_loss: 0.0873, reg_loss: 0.0871 ||: 13%|#2 | 14/111 [00:10<01:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9300, LAS: 0.8676, UEM: 0.5688, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5562, partial_loss/deprel_loss: 0.6804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7430, loss: 0.8469, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||: 16%|#6 | 18/111 [00:12<01:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9308, LAS: 0.8677, UEM: 0.5772, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 0.4864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.8475, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||: 20%|#9 | 22/111 [00:15<01:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9230, LAS: 0.8594, UEM: 0.5669, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3768, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.9163, batch_reg_loss: 0.0875, reg_loss: 0.0872 ||: 23%|##2 | 25/111 [00:17<01:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8352, UAS: 0.9221, LAS: 0.8583, UEM: 0.5419, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 1.1264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.9262, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||: 25%|##5 | 28/111 [00:19<00:57, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9203, LAS: 0.8562, UEM: 0.5457, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3203, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.9386, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||: 28%|##7 | 31/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9183, LAS: 0.8538, UEM: 0.5326, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9560, partial_loss/deprel_loss: 0.9772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9626, batch_reg_loss: 0.0877, reg_loss: 0.0874 ||: 32%|###1 | 35/111 [00:24<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9185, LAS: 0.8543, UEM: 0.5263, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.9598, batch_reg_loss: 0.0878, reg_loss: 0.0874 ||: 35%|###5 | 39/111 [00:27<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9138, LAS: 0.8490, UEM: 0.5170, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5910, loss: 1.0039, batch_reg_loss: 0.0879, reg_loss: 0.0874 ||: 39%|###8 | 43/111 [00:29<00:47, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9152, LAS: 0.8507, UEM: 0.5210, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.6749, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.9916, batch_reg_loss: 0.0880, reg_loss: 0.0875 ||: 41%|####1 | 46/111 [00:32<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8042, UAS: 0.9142, LAS: 0.8494, UEM: 0.5098, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3450, partial_loss/deprel_loss: 1.1223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2549, loss: 0.9971, batch_reg_loss: 0.0881, reg_loss: 0.0875 ||: 44%|####4 | 49/111 [00:34<00:44, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9148, LAS: 0.8502, UEM: 0.5006, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7142, loss: 0.9906, batch_reg_loss: 0.0882, reg_loss: 0.0876 ||: 48%|####7 | 53/111 [00:36<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9139, LAS: 0.8492, UEM: 0.4906, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7870, loss: 0.9980, batch_reg_loss: 0.0883, reg_loss: 0.0876 ||: 51%|#####1 | 57/111 [00:39<00:35, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7875, UAS: 0.9122, LAS: 0.8470, UEM: 0.4822, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5783, partial_loss/deprel_loss: 1.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.0136, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||: 55%|#####4 | 61/111 [00:41<00:33, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9123, LAS: 0.8474, UEM: 0.4979, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 1.0101, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||: 59%|#####8 | 65/111 [00:44<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9124, LAS: 0.8475, UEM: 0.4922, LEM: 0.2636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3323, partial_loss/deprel_loss: 1.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4005, loss: 1.0098, batch_reg_loss: 0.0885, reg_loss: 0.0877 ||: 61%|######1 | 68/111 [00:46<00:29, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9130, LAS: 0.8481, UEM: 0.4973, LEM: 0.2674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1742, partial_loss/deprel_loss: 1.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2885, loss: 1.0040, batch_reg_loss: 0.0886, reg_loss: 0.0878 ||: 64%|######3 | 71/111 [00:48<00:27, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9135, LAS: 0.8489, UEM: 0.5123, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.3012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3576, loss: 0.9980, batch_reg_loss: 0.0887, reg_loss: 0.0878 ||: 68%|######7 | 75/111 [00:51<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9134, LAS: 0.8486, UEM: 0.5078, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7427, partial_loss/deprel_loss: 0.9010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 1.0009, batch_reg_loss: 0.0887, reg_loss: 0.0879 ||: 70%|####### | 78/111 [00:53<00:23, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7803, UAS: 0.9131, LAS: 0.8483, UEM: 0.5069, LEM: 0.2774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8427, partial_loss/deprel_loss: 1.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7260, loss: 1.0046, batch_reg_loss: 0.0888, reg_loss: 0.0879 ||: 73%|#######2 | 81/111 [00:56<00:21, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8095, UAS: 0.9134, LAS: 0.8483, UEM: 0.5000, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2830, partial_loss/deprel_loss: 1.1385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2563, loss: 1.0034, batch_reg_loss: 0.0889, reg_loss: 0.0879 ||: 77%|#######6 | 85/111 [00:58<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9131, LAS: 0.8480, UEM: 0.4932, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.8970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9682, loss: 1.0072, batch_reg_loss: 0.0890, reg_loss: 0.0880 ||: 80%|######## | 89/111 [01:00<00:14, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9132, LAS: 0.8480, UEM: 0.4909, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3357, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5952, loss: 1.0083, batch_reg_loss: 0.0891, reg_loss: 0.0880 ||: 84%|########3 | 93/111 [01:03<00:11, 
1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9140, LAS: 0.8488, UEM: 0.4943, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.7979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.0029, batch_reg_loss: 0.0892, reg_loss: 0.0881 ||: 87%|########7 | 97/111 [01:06<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9135, LAS: 0.8483, UEM: 0.4857, LEM: 0.2584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1926, partial_loss/deprel_loss: 1.1354, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0052, batch_reg_loss: 0.0893, reg_loss: 0.0881 ||: 91%|######### | 101/111 [01:08<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8649, UAS: 0.9144, LAS: 0.8493, UEM: 0.4890, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6948, partial_loss/deprel_loss: 0.8095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8759, loss: 0.9975, batch_reg_loss: 0.0893, reg_loss: 0.0882 ||: 94%|#########3| 104/111 [01:11<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8489, UAS: 0.9143, LAS: 0.8492, UEM: 0.4848, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9411, partial_loss/deprel_loss: 0.8917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9910, loss: 0.9983, batch_reg_loss: 0.0894, reg_loss: 0.0882 ||: 96%|#########6| 107/111 [01:13<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9151, LAS: 0.8501, UEM: 0.4914, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3863, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6691, loss: 0.9898, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||: 99%|#########9| 110/111 [01:15<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9153, LAS: 0.8503, UEM: 0.4906, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.8068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.9886, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.807 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.570 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - reg_loss | 0.088 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UEM | 
0.491 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LAS | 0.850 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - loss | 0.989 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LEM | 0.257 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - UAS | 0.915 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EM | 0.870 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:14:50,916 - INFO - combo.training.trainer - Epoch duration: 0:01:16.019608\n", + "2023-04-06 23:14:50,917 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:31\n", + "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Epoch 19/399\n", + "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 23:14:50,923 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9280, LAS: 0.8663, UEM: 0.4818, LEM: 0.2052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.5427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5920, 
loss: 0.8326, batch_reg_loss: 0.0896, reg_loss: 0.0896 ||: 4%|3 | 4/111 [00:02<01:06, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9147, LAS: 0.8502, UEM: 0.3867, LEM: 0.1510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0561, partial_loss/deprel_loss: 1.0243, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1203, loss: 0.9958, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||: 6%|6 | 7/111 [00:04<01:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7890, UAS: 0.9112, LAS: 0.8450, UEM: 0.3595, LEM: 0.1344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5057, partial_loss/deprel_loss: 1.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5460, loss: 1.0469, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||: 9%|9 | 10/111 [00:06<01:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9132, LAS: 0.8471, UEM: 0.3635, LEM: 0.1282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8014, partial_loss/deprel_loss: 0.8880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9604, loss: 1.0209, batch_reg_loss: 0.0898, reg_loss: 0.0897 ||: 12%|#1 | 13/111 [00:08<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8711, UAS: 0.9142, LAS: 0.8481, UEM: 0.3500, LEM: 0.1202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5703, partial_loss/deprel_loss: 0.7201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7801, loss: 1.0151, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||: 15%|#5 | 17/111 [00:11<01:02, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9147, LAS: 0.8485, UEM: 0.3594, 
LEM: 0.1297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 1.1270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2538, loss: 1.0083, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||: 18%|#8 | 20/111 [00:13<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9089, LAS: 0.8422, UEM: 0.3288, LEM: 0.1173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0613, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0698, loss: 1.0639, batch_reg_loss: 0.0900, reg_loss: 0.0898 ||: 22%|##1 | 24/111 [00:16<00:57, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9075, LAS: 0.8401, UEM: 0.3043, LEM: 0.1081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1332, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2239, loss: 1.0805, batch_reg_loss: 0.0901, reg_loss: 0.0898 ||: 25%|##5 | 28/111 [00:18<00:54, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9118, LAS: 0.8454, UEM: 0.3797, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.4029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4631, loss: 1.0336, batch_reg_loss: 0.0902, reg_loss: 0.0899 ||: 28%|##7 | 31/111 [00:20<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9146, LAS: 0.8488, UEM: 0.4005, LEM: 0.1766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 1.0074, batch_reg_loss: 0.0903, reg_loss: 
0.0899 ||: 32%|###1 | 35/111 [00:23<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9167, LAS: 0.8515, UEM: 0.4096, LEM: 0.1790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5449, partial_loss/deprel_loss: 0.7061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.9820, batch_reg_loss: 0.0904, reg_loss: 0.0899 ||: 35%|###5 | 39/111 [00:25<00:47, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9189, LAS: 0.8544, UEM: 0.4478, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.4174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.9584, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||: 38%|###7 | 42/111 [00:28<00:47, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8055, UAS: 0.9189, LAS: 0.8545, UEM: 0.4558, LEM: 0.2175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4937, partial_loss/deprel_loss: 1.2253, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3695, loss: 0.9560, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||: 41%|#### | 45/111 [00:30<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9134, LAS: 0.8488, UEM: 0.4408, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9478, partial_loss/deprel_loss: 1.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6940, loss: 1.0013, batch_reg_loss: 0.0906, reg_loss: 0.0901 ||: 44%|####4 | 49/111 [00:33<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9136, LAS: 0.8490, UEM: 0.4447, LEM: 0.2155, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.4641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5266, loss: 1.0002, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||: 47%|####6 | 52/111 [00:35<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9148, LAS: 0.8508, UEM: 0.4497, LEM: 0.2170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8531, partial_loss/deprel_loss: 0.7755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8818, loss: 0.9856, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||: 50%|####9 | 55/111 [00:37<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9144, LAS: 0.8503, UEM: 0.4407, LEM: 0.2094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4102, partial_loss/deprel_loss: 0.7027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.9948, batch_reg_loss: 0.0908, reg_loss: 0.0902 ||: 53%|#####3 | 59/111 [00:40<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9144, LAS: 0.8500, UEM: 0.4305, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7175, partial_loss/deprel_loss: 0.8354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9027, loss: 0.9954, batch_reg_loss: 0.0909, reg_loss: 0.0902 ||: 57%|#####6 | 63/111 [00:42<00:32, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9160, LAS: 0.8519, UEM: 0.4603, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1260, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3537, loss: 0.9770, batch_reg_loss: 0.0910, reg_loss: 0.0903 ||: 
59%|#####9 | 66/111 [00:44<00:31, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9146, LAS: 0.8503, UEM: 0.4620, LEM: 0.2308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.5944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6387, loss: 0.9922, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||: 62%|######2 | 69/111 [00:47<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9152, LAS: 0.8511, UEM: 0.4865, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0865, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2703, loss: 0.9884, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||: 65%|######4 | 72/111 [00:49<00:29, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7450, UAS: 0.9129, LAS: 0.8483, UEM: 0.4786, LEM: 0.2592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4474, partial_loss/deprel_loss: 1.6060, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8655, loss: 1.0093, batch_reg_loss: 0.0912, reg_loss: 0.0904 ||: 68%|######7 | 75/111 [00:51<00:26, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9145, LAS: 0.8501, UEM: 0.4913, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3422, partial_loss/deprel_loss: 0.5563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6047, loss: 0.9942, batch_reg_loss: 0.0913, reg_loss: 0.0904 ||: 70%|####### | 78/111 [00:53<00:23, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8686, UAS: 0.9147, LAS: 0.8503, UEM: 0.4911, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8614, loss: 0.9942, batch_reg_loss: 0.0914, reg_loss: 0.0904 ||: 74%|#######3 | 82/111 [00:56<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9148, LAS: 0.8505, UEM: 0.4921, LEM: 0.2639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3560, partial_loss/deprel_loss: 1.2549, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3665, loss: 0.9919, batch_reg_loss: 0.0914, reg_loss: 0.0905 ||: 77%|#######6 | 85/111 [00:58<00:18, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8503, UAS: 0.9139, LAS: 0.8493, UEM: 0.4854, LEM: 0.2583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7237, partial_loss/deprel_loss: 0.8698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9321, loss: 1.0020, batch_reg_loss: 0.0915, reg_loss: 0.0905 ||: 80%|######## | 89/111 [01:01<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9132, LAS: 0.8486, UEM: 0.4798, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6280, partial_loss/deprel_loss: 1.2208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3938, loss: 1.0073, batch_reg_loss: 0.0916, reg_loss: 0.0905 ||: 83%|########2 | 92/111 [01:03<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9145, LAS: 0.8499, UEM: 0.4895, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4991, loss: 0.9969, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||: 86%|########5 | 95/111 [01:05<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8012, UAS: 0.9144, LAS: 0.8497, UEM: 0.4877, LEM: 0.2581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4152, partial_loss/deprel_loss: 1.2303, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3590, loss: 0.9990, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||: 88%|########8 | 98/111 [01:07<00:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9146, LAS: 0.8498, UEM: 0.4837, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.9972, batch_reg_loss: 0.0918, reg_loss: 0.0907 ||: 91%|######### | 101/111 [01:09<00:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9154, LAS: 0.8507, UEM: 0.4849, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6166, loss: 0.9904, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||: 95%|#########4| 105/111 [01:12<00:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9157, LAS: 0.8511, UEM: 0.4917, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.6486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.9860, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||: 97%|#########7| 108/111 [01:15<00:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:16:08,307 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.134 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.302 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - 
combo.training.tensorboard_writer - reg_loss | 0.091 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UEM | 0.494 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LAS | 0.851 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - loss | 0.984 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LEM | 0.260 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - UAS | 0.916 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EM | 0.810 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:16:08,309 - INFO - combo.training.trainer - Epoch duration: 0:01:17.392753\n", + "2023-04-06 23:16:08,310 - INFO - combo.training.trainer - Estimated training time remaining: 8:20:39\n", + "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Epoch 20/399\n", + "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 23:16:08,316 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9521, LAS: 0.8974, UEM: 0.7753, LEM: 0.6200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.6386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6190, batch_reg_loss: 0.0921, reg_loss: 0.0920 ||: 3%|2 | 3/111 [00:02<01:31, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7149, UAS: 0.9217, LAS: 0.8639, UEM: 0.7221, LEM: 0.5348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0170, partial_loss/deprel_loss: 1.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1901, loss: 0.8866, batch_reg_loss: 0.0921, reg_loss: 0.0921 ||: 6%|6 | 7/111 [00:04<01:20, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9203, LAS: 0.8612, UEM: 0.6885, LEM: 0.4941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2541, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5005, loss: 0.9092, batch_reg_loss: 0.0922, reg_loss: 0.0921 ||: 9%|9 | 10/111 [00:07<01:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9200, LAS: 0.8602, UEM: 0.6465, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9482, partial_loss/deprel_loss: 1.0288, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9218, batch_reg_loss: 0.0923, reg_loss: 0.0921 ||: 12%|#1 | 13/111 [00:09<01:13, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9260, LAS: 0.8667, UEM: 0.6404, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3305, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.8611, batch_reg_loss: 0.0923, reg_loss: 0.0922 ||: 15%|#5 | 17/111 [00:11<01:06, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9266, LAS: 0.8650, UEM: 0.6031, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6330, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8662, loss: 0.8658, batch_reg_loss: 0.0924, reg_loss: 0.0922 ||: 19%|#8 | 21/111 [00:14<01:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9235, LAS: 0.8615, UEM: 0.5818, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5684, partial_loss/deprel_loss: 0.7775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.8950, batch_reg_loss: 0.0925, reg_loss: 0.0923 ||: 22%|##1 | 24/111 [00:16<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9259, LAS: 0.8641, UEM: 0.5802, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.6752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7301, loss: 0.8726, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||: 24%|##4 | 27/111 [00:18<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9255, LAS: 0.8640, UEM: 0.5700, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.8753, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||: 27%|##7 | 30/111 [00:20<00:56, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9263, LAS: 0.8651, UEM: 0.5635, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.5597, partial_loss/deprel_loss: 0.6210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7014, loss: 0.8682, batch_reg_loss: 0.0927, reg_loss: 0.0923 ||: 30%|##9 | 33/111 [00:22<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9252, LAS: 0.8637, UEM: 0.5582, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.5773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.8801, batch_reg_loss: 0.0927, reg_loss: 0.0924 ||: 32%|###2 | 36/111 [00:24<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9254, LAS: 0.8637, UEM: 0.5541, LEM: 0.3170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, partial_loss/deprel_loss: 0.7761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8396, loss: 0.8814, batch_reg_loss: 0.0928, reg_loss: 0.0924 ||: 35%|###5 | 39/111 [00:27<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9236, LAS: 0.8612, UEM: 0.5381, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 0.9462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0529, loss: 0.9042, batch_reg_loss: 0.0929, reg_loss: 0.0924 ||: 38%|###7 | 42/111 [00:29<00:50, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9249, LAS: 0.8627, UEM: 0.5504, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8873, partial_loss/deprel_loss: 1.0102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0786, loss: 0.8923, batch_reg_loss: 0.0929, reg_loss: 0.0925 ||: 41%|#### | 45/111 [00:31<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9246, LAS: 0.8622, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8750, partial_loss/deprel_loss: 0.9418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0214, loss: 0.8949, batch_reg_loss: 0.0930, reg_loss: 0.0925 ||: 44%|####4 | 49/111 [00:33<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9244, LAS: 0.8620, UEM: 0.5327, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7190, partial_loss/deprel_loss: 0.8342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9043, loss: 0.8976, batch_reg_loss: 0.0931, reg_loss: 0.0925 ||: 47%|####6 | 52/111 [00:35<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9237, LAS: 0.8612, UEM: 0.5251, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.6874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7233, loss: 0.9062, batch_reg_loss: 0.0931, reg_loss: 0.0926 ||: 50%|####9 | 55/111 [00:37<00:38, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9240, LAS: 0.8615, UEM: 0.5296, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3117, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.9034, batch_reg_loss: 0.0932, reg_loss: 0.0926 ||: 52%|#####2 | 58/111 [00:40<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9247, LAS: 0.8623, UEM: 0.5344, LEM: 0.2969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3854, 
partial_loss/deprel_loss: 0.5744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.8967, batch_reg_loss: 0.0933, reg_loss: 0.0926 ||: 55%|#####4 | 61/111 [00:42<00:35, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7501, UAS: 0.9220, LAS: 0.8592, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0578, partial_loss/deprel_loss: 1.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8619, loss: 0.9225, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||: 59%|#####8 | 65/111 [00:45<00:32, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9210, LAS: 0.8582, UEM: 0.5109, LEM: 0.2804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.9579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0274, loss: 0.9295, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||: 62%|######2 | 69/111 [00:47<00:27, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8715, UAS: 0.9208, LAS: 0.8578, UEM: 0.5065, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.7648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8241, loss: 0.9320, batch_reg_loss: 0.0935, reg_loss: 0.0928 ||: 66%|######5 | 73/111 [00:50<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9205, LAS: 0.8575, UEM: 0.5089, LEM: 0.2756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4596, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.9351, batch_reg_loss: 0.0936, reg_loss: 0.0928 ||: 
69%|######9 | 77/111 [00:53<00:23, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9196, LAS: 0.8565, UEM: 0.5025, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3989, partial_loss/deprel_loss: 1.2230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3519, loss: 0.9459, batch_reg_loss: 0.0937, reg_loss: 0.0929 ||: 73%|#######2 | 81/111 [00:55<00:19, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9202, LAS: 0.8571, UEM: 0.5031, LEM: 0.2700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6244, loss: 0.9399, batch_reg_loss: 0.0938, reg_loss: 0.0929 ||: 77%|#######6 | 85/111 [00:57<00:16, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9193, LAS: 0.8562, UEM: 0.4962, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9018, partial_loss/deprel_loss: 1.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6089, loss: 0.9479, batch_reg_loss: 0.0939, reg_loss: 0.0929 ||: 80%|######## | 89/111 [01:01<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7733, UAS: 0.9190, LAS: 0.8557, UEM: 0.4967, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9213, partial_loss/deprel_loss: 1.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7167, loss: 0.9522, batch_reg_loss: 0.0940, reg_loss: 0.0930 ||: 83%|########2 | 92/111 [01:03<00:13, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8547, UAS: 0.9182, LAS: 0.8549, UEM: 0.4904, LEM: 0.2589, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8669, loss: 0.9578, batch_reg_loss: 0.0941, reg_loss: 0.0930 ||: 86%|########6 | 96/111 [01:05<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8160, UAS: 0.9179, LAS: 0.8545, UEM: 0.4835, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3356, partial_loss/deprel_loss: 1.2480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9618, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||: 90%|######### | 100/111 [01:08<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9185, LAS: 0.8549, UEM: 0.4847, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8264, partial_loss/deprel_loss: 0.9697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0353, loss: 0.9581, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||: 93%|#########2| 103/111 [01:10<00:05, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9190, LAS: 0.8556, UEM: 0.5012, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1585, partial_loss/deprel_loss: 0.3249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3859, loss: 0.9525, batch_reg_loss: 0.0943, reg_loss: 0.0931 ||: 95%|#########5| 106/111 [01:12<00:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8343, UAS: 0.9174, LAS: 0.8537, UEM: 0.4963, LEM: 0.2666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9702, partial_loss/deprel_loss: 0.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0675, loss: 0.9691, batch_reg_loss: 0.0944, 
reg_loss: 0.0932 ||: 98%|#########8| 109/111 [01:14<00:01, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9175, LAS: 0.8538, UEM: 0.4941, LEM: 0.2641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9358, partial_loss/deprel_loss: 0.9596, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0492, loss: 0.9684, batch_reg_loss: 0.0944, reg_loss: 0.0932 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-06 23:17:24,438 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9379, LAS: 0.8819, UEM: 0.4929, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8324, partial_loss/deprel_loss: 30.4534, partial_loss/cycle_loss: 0.0000, batch_loss: 24.5292, loss: 22.6841, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8961, UEM: 0.7019, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4225, partial_loss/deprel_loss: 25.9318, partial_loss/cycle_loss: 0.0000, batch_loss: 20.8300, loss: 21.0524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:07, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9460, LAS: 0.8899, UEM: 0.6444, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6182, partial_loss/deprel_loss: 33.9471, partial_loss/cycle_loss: 0.0000, batch_loss: 27.2813, loss: 21.9483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9433, LAS: 0.8872, UEM: 0.6348, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1976, partial_loss/deprel_loss: 23.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 18.6898, loss: 24.3207, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:09<00:01, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9382, LAS: 0.8808, UEM: 0.6098, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5354, partial_loss/deprel_loss: 23.9953, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3033, loss: 25.6272, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00, 1.09it/s]\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.960 | 23.995\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.936 | 
0.535\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - reg_loss | 0.093 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UEM | 0.494 | 0.610\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LAS | 0.854 | 0.881\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - loss | 0.968 | 25.627\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEM | 0.264 | 0.350\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UAS | 0.918 | 0.938\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EM | 0.845 | 0.885\n", + "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Epoch duration: 0:01:28.060274\n", + "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:02\n", + "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Epoch 21/399\n", + "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:17:36,371 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:17:36,376 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9258, LAS: 
0.8623, UEM: 0.3812, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0052, partial_loss/deprel_loss: 0.9565, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9069, batch_reg_loss: 0.0945, reg_loss: 0.0944 ||: 3%|2 | 3/111 [00:02<01:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9203, LAS: 0.8558, UEM: 0.3611, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 0.9642, batch_reg_loss: 0.0946, reg_loss: 0.0945 ||: 6%|6 | 7/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8580, UAS: 0.9250, LAS: 0.8613, UEM: 0.3832, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8690, partial_loss/deprel_loss: 0.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.9139, batch_reg_loss: 0.0947, reg_loss: 0.0945 ||: 10%|9 | 11/111 [00:07<01:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9155, LAS: 0.8505, UEM: 0.3310, LEM: 0.1096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7844, partial_loss/deprel_loss: 0.8858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9602, loss: 0.9989, batch_reg_loss: 0.0947, reg_loss: 0.0946 ||: 14%|#3 | 15/111 [00:09<01:03, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8521, UAS: 0.9187, LAS: 0.8536, UEM: 0.3559, LEM: 0.1284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7069, partial_loss/deprel_loss: 0.9114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9654, loss: 0.9738, batch_reg_loss: 0.0948, 
reg_loss: 0.0946 ||: 17%|#7 | 19/111 [00:12<01:00, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9194, LAS: 0.8549, UEM: 0.3802, LEM: 0.1447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9340, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9937, loss: 0.9615, batch_reg_loss: 0.0949, reg_loss: 0.0947 ||: 21%|## | 23/111 [00:14<00:56, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9213, LAS: 0.8573, UEM: 0.4043, LEM: 0.1632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.9402, batch_reg_loss: 0.0950, reg_loss: 0.0947 ||: 24%|##4 | 27/111 [00:17<00:52, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9229, LAS: 0.8593, UEM: 0.4209, LEM: 0.1772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3523, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.9247, batch_reg_loss: 0.0951, reg_loss: 0.0948 ||: 28%|##7 | 31/111 [00:19<00:51, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9226, LAS: 0.8594, UEM: 0.4405, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7041, partial_loss/deprel_loss: 0.8753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9363, loss: 0.9259, batch_reg_loss: 0.0952, reg_loss: 0.0948 ||: 32%|###1 | 35/111 [00:22<00:48, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9234, LAS: 0.8603, UEM: 0.4429, LEM: 0.2005, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9610, partial_loss/deprel_loss: 0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0052, loss: 0.9134, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||: 35%|###5 | 39/111 [00:25<00:46, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7296, UAS: 0.9207, LAS: 0.8576, UEM: 0.4694, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0297, partial_loss/deprel_loss: 1.8059, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1460, loss: 0.9392, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||: 38%|###7 | 42/111 [00:27<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9230, LAS: 0.8604, UEM: 0.4986, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.6117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6704, loss: 0.9153, batch_reg_loss: 0.0954, reg_loss: 0.0949 ||: 41%|#### | 45/111 [00:29<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8595, UAS: 0.9227, LAS: 0.8601, UEM: 0.4996, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7368, partial_loss/deprel_loss: 0.8730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.9158, batch_reg_loss: 0.0954, reg_loss: 0.0950 ||: 43%|####3 | 48/111 [00:31<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9213, LAS: 0.8584, UEM: 0.4874, LEM: 0.2479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9492, partial_loss/deprel_loss: 1.1123, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1752, loss: 0.9301, batch_reg_loss: 0.0955, reg_loss: 0.0950 ||: 46%|####5 | 
51/111 [00:34<00:43, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9193, LAS: 0.8562, UEM: 0.4801, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.7754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8328, loss: 0.9488, batch_reg_loss: 0.0956, reg_loss: 0.0950 ||: 49%|####8 | 54/111 [00:36<00:41, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9175, LAS: 0.8539, UEM: 0.4693, LEM: 0.2347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2272, partial_loss/deprel_loss: 1.2433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3357, loss: 0.9674, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||: 52%|#####2 | 58/111 [00:38<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9193, LAS: 0.8564, UEM: 0.5091, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1029, partial_loss/deprel_loss: 0.2265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2975, loss: 0.9466, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||: 55%|#####4 | 61/111 [00:41<00:39, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9187, LAS: 0.8552, UEM: 0.4985, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6729, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8682, loss: 0.9533, batch_reg_loss: 0.0958, reg_loss: 0.0951 ||: 59%|#####8 | 65/111 [00:44<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9188, LAS: 0.8557, UEM: 0.4976, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3849, partial_loss/deprel_loss: 1.1817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3182, loss: 0.9503, batch_reg_loss: 0.0959, reg_loss: 0.0952 ||: 61%|######1 | 68/111 [00:46<00:30, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9184, LAS: 0.8552, UEM: 0.4954, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2846, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.9528, batch_reg_loss: 0.0960, reg_loss: 0.0952 ||: 65%|######4 | 72/111 [00:48<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9177, LAS: 0.8545, UEM: 0.4896, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9335, loss: 0.9619, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||: 68%|######8 | 76/111 [00:51<00:23, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8785, UAS: 0.9189, LAS: 0.8556, UEM: 0.4982, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6560, loss: 0.9503, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||: 71%|#######1 | 79/111 [00:54<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9170, LAS: 0.8532, UEM: 0.4909, LEM: 0.2626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7202, partial_loss/deprel_loss: 1.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6166, 
loss: 0.9708, batch_reg_loss: 0.0962, reg_loss: 0.0953 ||: 74%|#######3 | 82/111 [00:56<00:20, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.9167, LAS: 0.8527, UEM: 0.4814, LEM: 0.2560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9546, partial_loss/deprel_loss: 1.0401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1193, loss: 0.9757, batch_reg_loss: 0.0963, reg_loss: 0.0954 ||: 77%|#######7 | 86/111 [00:58<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9178, LAS: 0.8541, UEM: 0.4946, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.6831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7291, loss: 0.9636, batch_reg_loss: 0.0964, reg_loss: 0.0954 ||: 80%|######## | 89/111 [01:00<00:15, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9177, LAS: 0.8538, UEM: 0.4900, LEM: 0.2610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2122, partial_loss/deprel_loss: 1.0230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1573, loss: 0.9669, batch_reg_loss: 0.0965, reg_loss: 0.0954 ||: 83%|########2 | 92/111 [01:02<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9174, LAS: 0.8535, UEM: 0.4914, LEM: 0.2603, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3006, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.9690, batch_reg_loss: 0.0965, reg_loss: 0.0955 ||: 86%|########5 | 95/111 [01:04<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, 
UAS: 0.9168, LAS: 0.8528, UEM: 0.4893, LEM: 0.2586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4066, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.9755, batch_reg_loss: 0.0966, reg_loss: 0.0955 ||: 88%|########8 | 98/111 [01:07<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9167, LAS: 0.8525, UEM: 0.4840, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6369, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8077, loss: 0.9770, batch_reg_loss: 0.0967, reg_loss: 0.0955 ||: 91%|######### | 101/111 [01:09<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9169, LAS: 0.8528, UEM: 0.4859, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8818, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9210, loss: 0.9743, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||: 95%|#########4| 105/111 [01:11<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9174, LAS: 0.8535, UEM: 0.4861, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5777, partial_loss/deprel_loss: 0.8117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.9685, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||: 97%|#########7| 108/111 [01:14<00:02, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.821 | N/A\n", + "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.613 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - reg_loss | 0.096 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UEM | 0.494 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LAS | 0.854 | N/A\n", + 
"2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - loss | 0.961 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEM | 0.258 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UAS | 0.918 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EM | 0.867 | N/A\n", + "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Epoch duration: 0:01:16.752609\n", + "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Estimated training time remaining: 8:19:56\n", + "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Epoch 22/399\n", + "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:18:53,130 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9361, LAS: 0.8734, UEM: 0.4864, LEM: 0.2167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8275, partial_loss/deprel_loss: 0.8561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9474, loss: 0.8003, batch_reg_loss: 0.0970, reg_loss: 0.0970 ||: 4%|3 | 4/111 [00:02<00:57, 1.86it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9300, LAS: 0.8699, UEM: 0.5067, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4623, partial_loss/deprel_loss: 1.1682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3241, loss: 0.8539, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||: 7%|7 | 8/111 [00:04<00:56, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9287, LAS: 0.8690, UEM: 0.4604, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7500, partial_loss/deprel_loss: 0.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9153, loss: 0.8580, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||: 11%|# | 12/111 [00:06<00:56, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9332, LAS: 0.8739, UEM: 0.5000, LEM: 0.2279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.8228, batch_reg_loss: 0.0972, reg_loss: 0.0971 ||: 14%|#3 | 15/111 [00:08<00:58, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9380, LAS: 0.8796, UEM: 0.5910, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4276, partial_loss/deprel_loss: 0.6461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.7743, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||: 16%|#6 | 18/111 [00:11<01:00, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9388, LAS: 0.8795, UEM: 0.5882, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5401, 
partial_loss/deprel_loss: 0.7525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8074, loss: 0.7672, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||: 19%|#8 | 21/111 [00:13<00:59, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9394, LAS: 0.8805, UEM: 0.5959, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8269, partial_loss/deprel_loss: 0.9416, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0160, loss: 0.7596, batch_reg_loss: 0.0974, reg_loss: 0.0971 ||: 22%|##1 | 24/111 [00:15<00:58, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9385, LAS: 0.8795, UEM: 0.5779, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6153, partial_loss/deprel_loss: 0.8072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8663, loss: 0.7663, batch_reg_loss: 0.0974, reg_loss: 0.0972 ||: 24%|##4 | 27/111 [00:17<00:57, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9341, LAS: 0.8746, UEM: 0.5516, LEM: 0.2868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8354, partial_loss/deprel_loss: 1.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4926, loss: 0.8122, batch_reg_loss: 0.0975, reg_loss: 0.0972 ||: 28%|##7 | 31/111 [00:20<00:53, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8138, UAS: 0.9303, LAS: 0.8703, UEM: 0.5369, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3798, partial_loss/deprel_loss: 1.2360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3623, loss: 0.8503, batch_reg_loss: 0.0976, reg_loss: 0.0972 ||: 32%|###1 | 35/111 [00:22<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9314, LAS: 0.8718, UEM: 0.5791, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6164, loss: 0.8361, batch_reg_loss: 0.0976, reg_loss: 0.0973 ||: 34%|###4 | 38/111 [00:25<00:55, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9312, LAS: 0.8709, UEM: 0.5703, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7824, loss: 0.8412, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||: 37%|###6 | 41/111 [00:27<00:52, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9275, LAS: 0.8665, UEM: 0.5581, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.7415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.8770, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||: 40%|###9 | 44/111 [00:29<00:48, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9283, LAS: 0.8671, UEM: 0.5570, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4666, partial_loss/deprel_loss: 0.6955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.8715, batch_reg_loss: 0.0978, reg_loss: 0.0974 ||: 43%|####3 | 48/111 [00:32<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9256, LAS: 0.8640, UEM: 0.5457, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4119, 
partial_loss/deprel_loss: 0.5915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6535, loss: 0.8893, batch_reg_loss: 0.0979, reg_loss: 0.0974 ||: 47%|####6 | 52/111 [00:35<00:40, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9268, LAS: 0.8653, UEM: 0.5666, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1844, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4296, loss: 0.8788, batch_reg_loss: 0.0980, reg_loss: 0.0974 ||: 50%|####9 | 55/111 [00:37<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9261, LAS: 0.8643, UEM: 0.5619, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5270, loss: 0.8857, batch_reg_loss: 0.0981, reg_loss: 0.0975 ||: 53%|#####3 | 59/111 [00:39<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7876, UAS: 0.9239, LAS: 0.8618, UEM: 0.5473, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7525, partial_loss/deprel_loss: 1.3168, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5021, loss: 0.9059, batch_reg_loss: 0.0982, reg_loss: 0.0975 ||: 57%|#####6 | 63/111 [00:42<00:32, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8164, UAS: 0.9234, LAS: 0.8610, UEM: 0.5373, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3867, partial_loss/deprel_loss: 1.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2997, loss: 0.9142, batch_reg_loss: 0.0982, reg_loss: 0.0976 ||: 59%|#####9 | 66/111 [00:44<00:30, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + 
"output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9236, LAS: 0.8612, UEM: 0.5420, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4252, partial_loss/deprel_loss: 1.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4806, loss: 0.9127, batch_reg_loss: 0.0983, reg_loss: 0.0976 ||: 62%|######2 | 69/111 [00:47<00:30, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9236, LAS: 0.8613, UEM: 0.5379, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5400, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7313, loss: 0.9139, batch_reg_loss: 0.0984, reg_loss: 0.0976 ||: 65%|######4 | 72/111 [00:49<00:28, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9226, LAS: 0.8598, UEM: 0.5300, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.7197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7784, loss: 0.9243, batch_reg_loss: 0.0985, reg_loss: 0.0977 ||: 68%|######8 | 76/111 [00:51<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9214, LAS: 0.8586, UEM: 0.5237, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7298, partial_loss/deprel_loss: 0.7075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8105, loss: 0.9339, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||: 72%|#######2 | 80/111 [00:54<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9218, LAS: 0.8591, UEM: 0.5252, LEM: 0.2861, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5913, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8066, loss: 0.9308, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9213, LAS: 0.8584, UEM: 0.5176, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4704, partial_loss/deprel_loss: 1.1766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3341, loss: 0.9378, batch_reg_loss: 0.0987, reg_loss: 0.0978 ||: 78%|#######8 | 87/111 [00:59<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7587, UAS: 0.9197, LAS: 0.8566, UEM: 0.5081, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3102, partial_loss/deprel_loss: 1.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8557, loss: 0.9530, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 82%|########1 | 91/111 [01:01<00:13, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9189, LAS: 0.8555, UEM: 0.4985, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2651, partial_loss/deprel_loss: 1.0647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2037, loss: 0.9623, batch_reg_loss: 0.0989, reg_loss: 0.0979 ||: 86%|########5 | 95/111 [01:04<00:10, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9190, LAS: 0.8555, UEM: 0.4983, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5153, partial_loss/deprel_loss: 0.7901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8342, loss: 0.9627, batch_reg_loss: 0.0990, reg_loss: 0.0979 ||: 
89%|########9 | 99/111 [01:06<00:07, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9191, LAS: 0.8558, UEM: 0.5012, LEM: 0.2698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7918, loss: 0.9603, batch_reg_loss: 0.0991, reg_loss: 0.0980 ||: 93%|#########2| 103/111 [01:09<00:05, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9187, LAS: 0.8553, UEM: 0.5018, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8508, partial_loss/deprel_loss: 0.9035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9639, batch_reg_loss: 0.0992, reg_loss: 0.0980 ||: 96%|#########6| 107/111 [01:11<00:02, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:20:07,331 - INFO - 
combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.693 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.439 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - reg_loss | 0.098 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UEM | 0.504 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LAS | 0.856 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - loss | 0.955 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEM | 0.269 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UAS | 0.920 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - 
combo.training.tensorboard_writer - EM | 0.880 | N/A\n", + "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Epoch duration: 0:01:14.210037\n", + "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Estimated training time remaining: 8:17:12\n", + "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Epoch 23/399\n", + "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:20:07,334 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:20:07,340 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.8949, LAS: 0.8287, UEM: 0.1098, LEM: 0.0122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1080, partial_loss/deprel_loss: 1.0936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1958, loss: 1.2573, batch_reg_loss: 0.0994, reg_loss: 0.0993 ||: 3%|2 | 3/111 [00:02<01:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9162, LAS: 0.8520, UEM: 0.4313, LEM: 0.1854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 0.9522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0594, loss: 1.0167, batch_reg_loss: 0.0994, reg_loss: 0.0994 ||: 5%|5 | 6/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9208, LAS: 0.8586, UEM: 0.4514, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4497, partial_loss/deprel_loss: 0.7025, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.9521, batch_reg_loss: 0.0995, reg_loss: 0.0994 ||: 9%|9 | 10/111 [00:06<01:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9220, LAS: 0.8594, UEM: 0.4382, LEM: 0.1919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5719, partial_loss/deprel_loss: 0.6911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7669, loss: 0.9378, batch_reg_loss: 0.0996, reg_loss: 0.0994 ||: 12%|#1 | 13/111 [00:08<01:05, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8195, UAS: 0.9152, LAS: 0.8517, UEM: 0.4119, LEM: 0.1816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2872, loss: 1.0058, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||: 15%|#5 | 17/111 [00:11<01:02, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9212, LAS: 0.8597, UEM: 0.5133, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.9357, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||: 18%|#8 | 20/111 [00:13<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7982, UAS: 0.9195, LAS: 0.8577, UEM: 0.4810, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6368, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4579, loss: 0.9546, batch_reg_loss: 0.0998, reg_loss: 0.0996 ||: 22%|##1 | 24/111 [00:16<00:58, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8528, UAS: 0.9207, LAS: 0.8587, UEM: 0.4830, LEM: 0.2536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7993, partial_loss/deprel_loss: 0.8640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9510, loss: 0.9487, batch_reg_loss: 0.0999, reg_loss: 0.0996 ||: 24%|##4 | 27/111 [00:18<00:57, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9174, LAS: 0.8551, UEM: 0.4849, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2721, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.9817, batch_reg_loss: 0.1000, reg_loss: 0.0996 ||: 27%|##7 | 30/111 [00:20<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9170, LAS: 0.8551, UEM: 0.4742, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2339, partial_loss/deprel_loss: 1.1452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2630, loss: 0.9804, batch_reg_loss: 0.1000, reg_loss: 0.0997 ||: 30%|##9 | 33/111 [00:22<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9191, LAS: 0.8576, UEM: 0.5179, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4324, loss: 0.9551, batch_reg_loss: 0.1001, reg_loss: 0.0997 ||: 32%|###2 | 36/111 [00:24<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9208, LAS: 0.8592, UEM: 0.5176, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3242, partial_loss/deprel_loss: 0.5435, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.5999, loss: 0.9375, batch_reg_loss: 0.1002, reg_loss: 0.0998 ||: 36%|###6 | 40/111 [00:27<00:49, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9215, LAS: 0.8597, UEM: 0.5178, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4017, partial_loss/deprel_loss: 0.5735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.9290, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||: 39%|###8 | 43/111 [00:29<00:47, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9230, LAS: 0.8616, UEM: 0.5530, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0951, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3023, loss: 0.9164, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||: 41%|####1 | 46/111 [00:31<00:48, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9233, LAS: 0.8621, UEM: 0.5553, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4974, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7402, loss: 0.9117, batch_reg_loss: 0.1004, reg_loss: 0.0999 ||: 44%|####4 | 49/111 [00:34<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8017, UAS: 0.9220, LAS: 0.8608, UEM: 0.5543, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5379, partial_loss/deprel_loss: 1.2708, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4247, loss: 0.9204, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||: 48%|####7 | 53/111 [00:36<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 
0.9218, LAS: 0.8605, UEM: 0.5487, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3058, partial_loss/deprel_loss: 0.5159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5744, loss: 0.9219, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||: 50%|##### | 56/111 [00:38<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9226, LAS: 0.8614, UEM: 0.5549, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.4572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.9170, batch_reg_loss: 0.1006, reg_loss: 0.1000 ||: 53%|#####3 | 59/111 [00:41<00:38, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5563, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.6772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 0.9111, batch_reg_loss: 0.1007, reg_loss: 0.1000 ||: 56%|#####5 | 62/111 [00:43<00:36, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9238, LAS: 0.8623, UEM: 0.5494, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4779, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9075, batch_reg_loss: 0.1008, reg_loss: 0.1000 ||: 59%|#####9 | 66/111 [00:46<00:32, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9234, LAS: 0.8620, UEM: 0.5454, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9666, 
partial_loss/deprel_loss: 0.9580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0606, loss: 0.9100, batch_reg_loss: 0.1008, reg_loss: 0.1001 ||: 62%|######2 | 69/111 [00:48<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9209, LAS: 0.8594, UEM: 0.5390, LEM: 0.3046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.8047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9318, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||: 65%|######4 | 72/111 [00:50<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9218, LAS: 0.8603, UEM: 0.5415, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6952, partial_loss/deprel_loss: 0.8219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8975, loss: 0.9227, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||: 68%|######7 | 75/111 [00:52<00:26, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9209, LAS: 0.8591, UEM: 0.5355, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5396, partial_loss/deprel_loss: 0.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7220, loss: 0.9309, batch_reg_loss: 0.1010, reg_loss: 0.1002 ||: 71%|#######1 | 79/111 [00:55<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9214, LAS: 0.8597, UEM: 0.5347, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6287, loss: 0.9262, batch_reg_loss: 0.1011, reg_loss: 0.1002 ||: 74%|#######3 | 82/111 [00:57<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9216, LAS: 0.8599, UEM: 0.5292, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1648, partial_loss/deprel_loss: 1.1497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2539, loss: 0.9257, batch_reg_loss: 0.1012, reg_loss: 0.1003 ||: 77%|#######7 | 86/111 [00:59<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9212, LAS: 0.8595, UEM: 0.5286, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1797, partial_loss/deprel_loss: 1.0297, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1609, loss: 0.9283, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||: 80%|######## | 89/111 [01:02<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9205, LAS: 0.8586, UEM: 0.5206, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8560, partial_loss/deprel_loss: 0.8923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9864, loss: 0.9342, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||: 83%|########2 | 92/111 [01:04<00:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9196, LAS: 0.8574, UEM: 0.5135, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8253, partial_loss/deprel_loss: 0.8840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9737, loss: 0.9429, batch_reg_loss: 0.1014, reg_loss: 0.1004 ||: 86%|########5 | 95/111 [01:06<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9202, LAS: 0.8579, UEM: 0.5121, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4252, partial_loss/deprel_loss: 0.6383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9379, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||: 88%|########8 | 98/111 [01:08<00:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9202, LAS: 0.8578, UEM: 0.5151, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.9367, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||: 91%|######### | 101/111 [01:10<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9204, LAS: 0.8580, UEM: 0.5113, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5823, partial_loss/deprel_loss: 0.7403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8103, loss: 0.9358, batch_reg_loss: 0.1016, reg_loss: 0.1005 ||: 94%|#########3| 104/111 [01:13<00:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9201, LAS: 0.8575, UEM: 0.5075, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3702, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2781, loss: 0.9388, batch_reg_loss: 0.1017, reg_loss: 0.1005 ||: 96%|#########6| 107/111 [01:15<00:02, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 
[01:17<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.701 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.553 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - reg_loss | 0.101 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UEM | 0.503 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LAS | 0.857 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - loss | 0.942 | N/A\n", + "2023-04-06 
23:21:25,104 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEM | 0.268 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UAS | 0.920 | N/A\n", + "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - EM | 0.879 | N/A\n", + "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Epoch duration: 0:01:17.771978\n", + "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Estimated training time remaining: 8:15:32\n", + "2023-04-06 23:21:25,105 - INFO - allennlp.training.trainer - Epoch 24/399\n", + "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:21:25,112 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9498, LAS: 0.8965, UEM: 0.6134, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4244, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6136, loss: 0.6403, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||: 3%|2 | 3/111 [00:02<01:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9222, 
LAS: 0.8663, UEM: 0.5378, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0726, partial_loss/deprel_loss: 1.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5262, loss: 0.8804, batch_reg_loss: 0.1019, reg_loss: 0.1018 ||: 5%|5 | 6/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9254, LAS: 0.8696, UEM: 0.5613, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.8574, batch_reg_loss: 0.1020, reg_loss: 0.1019 ||: 8%|8 | 9/111 [00:06<01:13, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9290, LAS: 0.8697, UEM: 0.5375, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5027, partial_loss/deprel_loss: 0.7213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.8491, batch_reg_loss: 0.1021, reg_loss: 0.1019 ||: 12%|#1 | 13/111 [00:08<01:05, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8115, UAS: 0.9180, LAS: 0.8568, UEM: 0.4769, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3171, partial_loss/deprel_loss: 1.1869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3151, loss: 0.9530, batch_reg_loss: 0.1021, reg_loss: 0.1020 ||: 15%|#5 | 17/111 [00:11<01:01, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9202, LAS: 0.8585, UEM: 0.4617, LEM: 0.2124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.6378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.9386, batch_reg_loss: 
0.1022, reg_loss: 0.1020 ||: 19%|#8 | 21/111 [00:13<00:57, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9191, LAS: 0.8573, UEM: 0.4431, LEM: 0.1985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8136, loss: 0.9558, batch_reg_loss: 0.1023, reg_loss: 0.1020 ||: 22%|##1 | 24/111 [00:15<00:57, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9207, LAS: 0.8589, UEM: 0.4550, LEM: 0.2127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7988, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.9407, batch_reg_loss: 0.1024, reg_loss: 0.1021 ||: 25%|##5 | 28/111 [00:18<00:54, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9219, LAS: 0.8599, UEM: 0.4545, LEM: 0.2086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9907, partial_loss/deprel_loss: 0.9659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0733, loss: 0.9309, batch_reg_loss: 0.1025, reg_loss: 0.1021 ||: 28%|##7 | 31/111 [00:20<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8286, UAS: 0.9239, LAS: 0.8630, UEM: 0.5199, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1700, partial_loss/deprel_loss: 1.1138, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2275, loss: 0.9088, batch_reg_loss: 0.1025, reg_loss: 0.1022 ||: 31%|### | 34/111 [00:22<00:55, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9237, LAS: 0.8628, UEM: 0.5208, LEM: 0.2880, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3895, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9085, batch_reg_loss: 0.1026, reg_loss: 0.1022 ||: 34%|###4 | 38/111 [00:25<00:50, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9219, LAS: 0.8612, UEM: 0.5116, LEM: 0.2786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6607, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8475, loss: 0.9216, batch_reg_loss: 0.1027, reg_loss: 0.1022 ||: 38%|###7 | 42/111 [00:27<00:45, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7785, UAS: 0.9207, LAS: 0.8600, UEM: 0.5061, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8828, partial_loss/deprel_loss: 1.4185, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6141, loss: 0.9324, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||: 41%|####1 | 46/111 [00:30<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9206, LAS: 0.8598, UEM: 0.4985, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5178, partial_loss/deprel_loss: 1.2824, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4323, loss: 0.9363, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||: 45%|####5 | 50/111 [00:33<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9225, LAS: 0.8620, UEM: 0.5273, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.9186, batch_reg_loss: 0.1029, reg_loss: 0.1024 ||: 
48%|####7 | 53/111 [00:35<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9225, LAS: 0.8617, UEM: 0.5194, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.7654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.9208, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||: 50%|##### | 56/111 [00:37<00:37, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9223, LAS: 0.8611, UEM: 0.5155, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.6492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9261, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||: 53%|#####3 | 59/111 [00:39<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9211, LAS: 0.8598, UEM: 0.5063, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7221, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8899, loss: 0.9367, batch_reg_loss: 0.1031, reg_loss: 0.1025 ||: 56%|#####5 | 62/111 [00:41<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9183, LAS: 0.8566, UEM: 0.4943, LEM: 0.2676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0037, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0858, loss: 0.9632, batch_reg_loss: 0.1032, reg_loss: 0.1025 ||: 59%|#####9 | 66/111 [00:44<00:30, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, 
UAS: 0.9178, LAS: 0.8557, UEM: 0.4850, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1411, partial_loss/deprel_loss: 1.1626, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2616, loss: 0.9685, batch_reg_loss: 0.1033, reg_loss: 0.1025 ||: 63%|######3 | 70/111 [00:46<00:27, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9189, LAS: 0.8569, UEM: 0.4977, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.9568, batch_reg_loss: 0.1034, reg_loss: 0.1026 ||: 67%|######6 | 74/111 [00:49<00:24, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9177, LAS: 0.8557, UEM: 0.4966, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6101, partial_loss/deprel_loss: 1.1479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3438, loss: 0.9684, batch_reg_loss: 0.1035, reg_loss: 0.1026 ||: 69%|######9 | 77/111 [00:51<00:23, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9174, LAS: 0.8554, UEM: 0.4877, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8433, loss: 0.9711, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||: 73%|#######2 | 81/111 [00:54<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9177, LAS: 0.8554, UEM: 0.4819, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.7612, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.8219, loss: 0.9704, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||: 77%|#######6 | 85/111 [00:56<00:16, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9183, LAS: 0.8559, UEM: 0.4814, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6801, partial_loss/deprel_loss: 0.8225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 0.9660, batch_reg_loss: 0.1037, reg_loss: 0.1028 ||: 80%|######## | 89/111 [00:59<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9192, LAS: 0.8571, UEM: 0.4872, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.6416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7345, loss: 0.9550, batch_reg_loss: 0.1038, reg_loss: 0.1028 ||: 84%|########3 | 93/111 [01:01<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9200, LAS: 0.8581, UEM: 0.4941, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.9464, batch_reg_loss: 0.1039, reg_loss: 0.1028 ||: 87%|########7 | 97/111 [01:05<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9204, LAS: 0.8585, UEM: 0.5007, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.5752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6458, loss: 0.9437, batch_reg_loss: 0.1040, reg_loss: 0.1029 ||: 91%|######### | 101/111 [01:07<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8913, UAS: 0.9208, LAS: 0.8587, UEM: 0.5012, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3307, partial_loss/deprel_loss: 0.5607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6188, loss: 0.9398, batch_reg_loss: 0.1041, reg_loss: 0.1029 ||: 94%|#########3| 104/111 [01:10<00:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9209, LAS: 0.8588, UEM: 0.4988, LEM: 0.2634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5770, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7704, loss: 0.9390, batch_reg_loss: 0.1041, reg_loss: 0.1030 ||: 96%|#########6| 107/111 [01:12<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7959, UAS: 0.9205, LAS: 0.8584, UEM: 0.5038, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6188, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5033, loss: 0.9428, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||: 99%|#########9| 110/111 [01:14<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9208, LAS: 0.8587, UEM: 0.5047, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3658, partial_loss/deprel_loss: 0.5668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.9400, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||: 100%|##########| 111/111 [01:15<00:00, 1.48it/s]\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 
23:22:40,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.567 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.366 | N/A\n", + "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - reg_loss | 0.103 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UEM | 0.505 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LAS | 0.859 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - loss | 0.940 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEM | 0.270 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UAS | 0.921 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EM | 0.892 | N/A\n", + "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + 
"2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Epoch duration: 0:01:15.208139\n", + "2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Estimated training time remaining: 8:13:15\n", + "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Epoch 25/399\n", + "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:22:40,320 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9344, LAS: 0.8797, UEM: 0.4935, LEM: 0.2495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6547, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8849, loss: 0.7391, batch_reg_loss: 0.1042, reg_loss: 0.1042 ||: 3%|2 | 3/111 [00:02<01:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9349, LAS: 0.8766, UEM: 0.4955, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 1.0617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.7907, batch_reg_loss: 0.1043, reg_loss: 0.1043 ||: 5%|5 | 6/111 [00:04<01:13, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9163, LAS: 0.8558, UEM: 0.4640, LEM: 0.2246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3905, partial_loss/deprel_loss: 1.1573, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3083, loss: 0.9494, batch_reg_loss: 0.1044, reg_loss: 0.1043 ||: 9%|9 | 10/111 [00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9227, LAS: 0.8621, UEM: 0.4577, LEM: 0.2099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4299, partial_loss/deprel_loss: 0.6033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6731, loss: 0.9065, batch_reg_loss: 0.1045, reg_loss: 0.1043 ||: 13%|#2 | 14/111 [00:09<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9247, LAS: 0.8645, UEM: 0.4702, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6388, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8534, loss: 0.8863, batch_reg_loss: 0.1045, reg_loss: 0.1044 ||: 15%|#5 | 17/111 [00:11<01:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9276, LAS: 0.8682, UEM: 0.5241, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8834, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0513, loss: 0.8611, batch_reg_loss: 0.1046, reg_loss: 0.1044 ||: 18%|#8 | 20/111 [00:14<01:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8113, UAS: 0.9243, LAS: 0.8644, UEM: 0.4944, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5374, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3084, loss: 0.8922, batch_reg_loss: 0.1047, reg_loss: 0.1044 ||: 21%|## | 23/111 [00:16<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9286, LAS: 0.8690, UEM: 0.5379, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 
0.5448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8552, batch_reg_loss: 0.1047, reg_loss: 0.1045 ||: 23%|##3 | 26/111 [00:18<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7784, UAS: 0.9271, LAS: 0.8676, UEM: 0.5357, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1583, partial_loss/deprel_loss: 1.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6182, loss: 0.8713, batch_reg_loss: 0.1048, reg_loss: 0.1045 ||: 27%|##7 | 30/111 [00:20<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9281, LAS: 0.8688, UEM: 0.5477, LEM: 0.3002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5381, loss: 0.8613, batch_reg_loss: 0.1049, reg_loss: 0.1045 ||: 30%|##9 | 33/111 [00:22<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9289, LAS: 0.8693, UEM: 0.5395, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3442, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.8581, batch_reg_loss: 0.1049, reg_loss: 0.1046 ||: 32%|###2 | 36/111 [00:24<00:51, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8346, UAS: 0.9285, LAS: 0.8688, UEM: 0.5242, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 1.0839, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2047, loss: 0.8636, batch_reg_loss: 0.1050, reg_loss: 0.1046 ||: 36%|###6 | 40/111 [00:27<00:47, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.7681, UAS: 0.9278, LAS: 0.8681, UEM: 0.5437, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1504, partial_loss/deprel_loss: 1.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6852, loss: 0.8681, batch_reg_loss: 0.1051, reg_loss: 0.1046 ||: 39%|###8 | 43/111 [00:29<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9259, LAS: 0.8659, UEM: 0.5305, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8139, loss: 0.8856, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||: 42%|####2 | 47/111 [00:32<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9249, LAS: 0.8648, UEM: 0.5189, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6368, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8225, loss: 0.8922, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||: 45%|####5 | 50/111 [00:34<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9257, LAS: 0.8655, UEM: 0.5205, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.6185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.8873, batch_reg_loss: 0.1053, reg_loss: 0.1047 ||: 48%|####7 | 53/111 [00:36<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9251, LAS: 0.8652, UEM: 0.5197, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.4119, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8925, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||: 50%|##### | 56/111 [00:38<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9268, LAS: 0.8674, UEM: 0.5477, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4947, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7941, loss: 0.8777, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||: 53%|#####3 | 59/111 [00:41<00:39, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8073, UAS: 0.9261, LAS: 0.8666, UEM: 0.5477, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.1254, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3354, loss: 0.8834, batch_reg_loss: 0.1055, reg_loss: 0.1048 ||: 56%|#####5 | 62/111 [00:43<00:36, 1.33it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9259, LAS: 0.8663, UEM: 0.5460, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.8849, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||: 59%|#####9 | 66/111 [00:46<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8236, UAS: 0.9236, LAS: 0.8636, UEM: 0.5365, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2846, partial_loss/deprel_loss: 1.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2725, loss: 0.9055, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||: 62%|######2 | 69/111 [00:48<00:30, 
1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8148, UAS: 0.9225, LAS: 0.8623, UEM: 0.5268, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3223, partial_loss/deprel_loss: 1.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3767, loss: 0.9208, batch_reg_loss: 0.1057, reg_loss: 0.1050 ||: 65%|######4 | 72/111 [00:50<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.9220, LAS: 0.8616, UEM: 0.5317, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9413, partial_loss/deprel_loss: 1.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6091, loss: 0.9239, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||: 68%|######7 | 75/111 [00:52<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9222, LAS: 0.8616, UEM: 0.5255, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7652, partial_loss/deprel_loss: 0.8632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.9231, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||: 70%|####### | 78/111 [00:54<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9232, LAS: 0.8625, UEM: 0.5251, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 0.7356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7857, loss: 0.9174, batch_reg_loss: 0.1059, reg_loss: 0.1050 ||: 73%|#######2 | 81/111 [00:56<00:21, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9231, LAS: 0.8623, UEM: 0.5156, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 1.0232, partial_loss/deprel_loss: 1.1543, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2341, loss: 0.9186, batch_reg_loss: 0.1060, reg_loss: 0.1051 ||: 77%|#######6 | 85/111 [00:59<00:17, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9238, LAS: 0.8630, UEM: 0.5193, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5677, loss: 0.9128, batch_reg_loss: 0.1061, reg_loss: 0.1051 ||: 80%|######## | 89/111 [01:01<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9241, LAS: 0.8633, UEM: 0.5179, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0860, partial_loss/deprel_loss: 1.0809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1880, loss: 0.9103, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||: 83%|########2 | 92/111 [01:04<00:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8234, UAS: 0.9244, LAS: 0.8636, UEM: 0.5232, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2385, partial_loss/deprel_loss: 1.0176, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1680, loss: 0.9053, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||: 86%|########6 | 96/111 [01:06<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9233, LAS: 0.8623, UEM: 0.5169, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8967, partial_loss/deprel_loss: 0.9467, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0430, loss: 0.9148, batch_reg_loss: 0.1063, reg_loss: 0.1052 ||: 89%|########9 | 99/111 
[01:08<00:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9238, LAS: 0.8630, UEM: 0.5188, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.5105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.9090, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||: 92%|#########1| 102/111 [01:11<00:06, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9231, LAS: 0.8623, UEM: 0.5110, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7957, partial_loss/deprel_loss: 0.8864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.9154, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||: 95%|#########5| 106/111 [01:14<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7423, UAS: 0.9219, LAS: 0.8609, UEM: 0.5056, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8168, partial_loss/deprel_loss: 1.8275, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1319, loss: 0.9278, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||: 99%|#########9| 110/111 [01:16<00:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9221, LAS: 0.8612, UEM: 0.5086, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.9250, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:23:58,213 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9630, LAS: 0.9177, UEM: 0.8159, LEM: 0.5815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1737, partial_loss/deprel_loss: 20.5474, partial_loss/cycle_loss: 0.0000, batch_loss: 16.4726, loss: 21.0144, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9472, LAS: 0.8955, UEM: 0.7141, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0153, partial_loss/deprel_loss: 43.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9080, loss: 25.5731, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:07, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9444, LAS: 0.8901, UEM: 0.6600, LEM: 0.4105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7415, partial_loss/deprel_loss: 29.8373, partial_loss/cycle_loss: 0.0000, batch_loss: 24.0182, loss: 24.7509, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9442, LAS: 0.8901, UEM: 0.6403, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 17.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 14.1877, loss: 24.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.06it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9410, LAS: 0.8860, UEM: 0.6232, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 24.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6684, loss: 25.9867, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.06it/s]\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.551 | 24.486\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.323 | 0.398\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - reg_loss | 0.105 | 0.000\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UEM | 0.509 | 0.623\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LAS | 0.861 | 0.886\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - loss | 0.925 | 25.987\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LEM | 0.275 | 0.362\n", + "2023-04-06 
23:24:10,535 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - UAS | 0.922 | 0.941\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EM | 0.893 | 0.904\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Epoch duration: 0:01:30.221589\n", + "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Estimated training time remaining: 8:14:38\n", + "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Epoch 26/399\n", + "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:24:10,542 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9545, LAS: 0.9014, UEM: 0.6867, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.6380, batch_reg_loss: 0.1066, reg_loss: 0.1066 ||: 3%|2 | 3/111 [00:02<01:20, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9292, LAS: 0.8709, UEM: 0.5445, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7835, partial_loss/deprel_loss: 0.8604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9517, loss: 0.8619, batch_reg_loss: 0.1067, reg_loss: 
0.1066 ||: 6%|6 | 7/111 [00:04<01:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9296, LAS: 0.8722, UEM: 0.6059, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1357, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3499, loss: 0.8487, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||: 9%|9 | 10/111 [00:07<01:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9257, LAS: 0.8661, UEM: 0.5670, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8304, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9389, loss: 0.8925, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||: 13%|#2 | 14/111 [00:09<01:07, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5243, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5089, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8100, loss: 0.9244, batch_reg_loss: 0.1069, reg_loss: 0.1068 ||: 16%|#6 | 18/111 [00:11<01:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9243, LAS: 0.8631, UEM: 0.5139, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.5236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.9069, batch_reg_loss: 0.1070, reg_loss: 0.1068 ||: 19%|#8 | 21/111 [00:14<01:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9241, LAS: 0.8641, UEM: 0.5164, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.9046, batch_reg_loss: 0.1071, reg_loss: 0.1068 ||: 23%|##2 | 25/111 [00:16<00:57, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9258, LAS: 0.8660, UEM: 0.5084, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.8859, batch_reg_loss: 0.1072, reg_loss: 0.1069 ||: 26%|##6 | 29/111 [00:19<00:55, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9258, LAS: 0.8655, UEM: 0.5043, LEM: 0.2665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2740, partial_loss/deprel_loss: 0.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.8904, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||: 30%|##9 | 33/111 [00:21<00:51, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9282, LAS: 0.8682, UEM: 0.5457, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8672, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||: 32%|###2 | 36/111 [00:23<00:49, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9276, LAS: 0.8675, UEM: 0.5649, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3104, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5757, loss: 0.8686, batch_reg_loss: 0.1074, reg_loss: 0.1070 ||: 35%|###5 | 39/111 [00:26<00:48, 
1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9282, LAS: 0.8683, UEM: 0.5682, LEM: 0.3254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.4289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4971, loss: 0.8663, batch_reg_loss: 0.1075, reg_loss: 0.1070 ||: 39%|###8 | 43/111 [00:28<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9305, LAS: 0.8712, UEM: 0.5994, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3668, partial_loss/deprel_loss: 0.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.8445, batch_reg_loss: 0.1075, reg_loss: 0.1071 ||: 42%|####2 | 47/111 [00:31<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9285, LAS: 0.8689, UEM: 0.5846, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8792, partial_loss/deprel_loss: 0.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0116, loss: 0.8637, batch_reg_loss: 0.1076, reg_loss: 0.1071 ||: 46%|####5 | 51/111 [00:33<00:39, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9282, LAS: 0.8684, UEM: 0.5741, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4152, partial_loss/deprel_loss: 0.6219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6883, loss: 0.8696, batch_reg_loss: 0.1077, reg_loss: 0.1071 ||: 50%|####9 | 55/111 [00:36<00:36, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9289, LAS: 0.8689, UEM: 0.5806, 
LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7112, loss: 0.8649, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||: 53%|#####3 | 59/111 [00:39<00:35, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8305, UAS: 0.9287, LAS: 0.8687, UEM: 0.5776, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1911, partial_loss/deprel_loss: 1.0662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1991, loss: 0.8640, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||: 56%|#####5 | 62/111 [00:41<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9283, LAS: 0.8684, UEM: 0.5685, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0422, partial_loss/deprel_loss: 0.9557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0810, loss: 0.8660, batch_reg_loss: 0.1079, reg_loss: 0.1073 ||: 59%|#####9 | 66/111 [00:43<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9273, LAS: 0.8673, UEM: 0.5602, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.8741, batch_reg_loss: 0.1080, reg_loss: 0.1073 ||: 63%|######3 | 70/111 [00:46<00:27, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9263, LAS: 0.8659, UEM: 0.5479, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.7782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8876, loss: 0.8835, batch_reg_loss: 0.1081, 
reg_loss: 0.1073 ||: 67%|######6 | 74/111 [00:48<00:23, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9263, LAS: 0.8660, UEM: 0.5435, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8610, partial_loss/deprel_loss: 0.9041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0036, loss: 0.8832, batch_reg_loss: 0.1082, reg_loss: 0.1074 ||: 70%|####### | 78/111 [00:51<00:21, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9239, LAS: 0.8632, UEM: 0.5339, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0083, partial_loss/deprel_loss: 0.9057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0345, loss: 0.9074, batch_reg_loss: 0.1083, reg_loss: 0.1074 ||: 74%|#######3 | 82/111 [00:54<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9232, LAS: 0.8625, UEM: 0.5256, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.9146, batch_reg_loss: 0.1083, reg_loss: 0.1075 ||: 77%|#######7 | 86/111 [00:57<00:16, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9209, LAS: 0.8601, UEM: 0.5163, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1256, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1181, loss: 0.9341, batch_reg_loss: 0.1084, reg_loss: 0.1075 ||: 81%|########1 | 90/111 [00:59<00:14, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9218, LAS: 0.8611, UEM: 0.5218, 
LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3100, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5793, loss: 0.9257, batch_reg_loss: 0.1085, reg_loss: 0.1075 ||: 84%|########3 | 93/111 [01:02<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9222, LAS: 0.8613, UEM: 0.5183, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5588, partial_loss/deprel_loss: 0.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7451, loss: 0.9237, batch_reg_loss: 0.1086, reg_loss: 0.1076 ||: 86%|########6 | 96/111 [01:04<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9224, LAS: 0.8615, UEM: 0.5172, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0468, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1242, loss: 0.9211, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||: 90%|######### | 100/111 [01:06<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9214, LAS: 0.8605, UEM: 0.5132, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4873, partial_loss/deprel_loss: 0.6853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.9311, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||: 93%|#########2| 103/111 [01:08<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9221, LAS: 0.8612, UEM: 0.5180, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7112, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.9247, 
batch_reg_loss: 0.1088, reg_loss: 0.1077 ||: 95%|#########5| 106/111 [01:11<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9214, LAS: 0.8602, UEM: 0.5101, LEM: 0.2792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2259, partial_loss/deprel_loss: 1.2003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3143, loss: 0.9326, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||: 99%|#########9| 110/111 [01:13<00:00, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9217, LAS: 0.8605, UEM: 0.5109, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3606, partial_loss/deprel_loss: 0.6149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.9302, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-06 23:25:25,100 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.615 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.361 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - reg_loss | 0.108 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UEM | 0.511 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - LAS | 0.861 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - loss | 0.930 | N/A\n", + "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEM | 0.279 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - UAS | 0.922 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EM | 0.898 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:25:25,102 - INFO - combo.training.trainer - Epoch duration: 0:01:14.566974\n", + "2023-04-06 23:25:25,103 - INFO - combo.training.trainer - Estimated training time remaining: 8:12:13\n", + "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Epoch 27/399\n", + "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:25:25,110 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8523, UAS: 0.9369, LAS: 0.8747, UEM: 0.5058, LEM: 0.2442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8675, partial_loss/deprel_loss: 1.0086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8187, batch_reg_loss: 0.1090, reg_loss: 0.1090 ||: 4%|3 | 4/111 [00:02<01:07, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9336, LAS: 0.8740, UEM: 0.5125, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.8310, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||: 7%|7 | 8/111 [00:05<01:06, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.9243, LAS: 0.8646, UEM: 0.5087, LEM: 0.2633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3445, partial_loss/deprel_loss: 1.1262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2790, loss: 0.9138, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||: 10%|9 | 11/111 [00:07<01:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9269, LAS: 0.8667, UEM: 0.5467, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 1.0002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0854, loss: 0.8886, batch_reg_loss: 0.1092, reg_loss: 0.1091 ||: 13%|#2 | 14/111 [00:09<01:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9294, LAS: 0.8700, UEM: 0.5552, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5957, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||: 15%|#5 | 17/111 [00:11<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9265, LAS: 0.8674, UEM: 0.5617, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5139, loss: 0.8870, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||: 19%|#8 | 21/111 [00:14<01:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8317, UAS: 0.9271, LAS: 0.8678, UEM: 0.5447, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1042, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8804, batch_reg_loss: 0.1094, reg_loss: 0.1092 ||: 23%|##2 | 25/111 [00:16<00:55, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9287, LAS: 0.8691, UEM: 0.5503, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.8661, batch_reg_loss: 0.1095, reg_loss: 0.1092 ||: 26%|##6 | 29/111 [00:19<00:52, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9292, LAS: 0.8690, UEM: 0.5347, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.8093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8878, loss: 0.8647, batch_reg_loss: 0.1096, reg_loss: 0.1093 ||: 30%|##9 | 33/111 [00:21<00:49, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.7760, UAS: 0.9264, LAS: 0.8662, UEM: 0.5149, LEM: 0.2670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9272, partial_loss/deprel_loss: 1.4164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6282, loss: 0.8847, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||: 33%|###3 | 37/111 [00:24<00:46, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9237, LAS: 0.8637, UEM: 0.5148, LEM: 0.2693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4669, partial_loss/deprel_loss: 1.0744, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2626, loss: 0.9017, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||: 37%|###6 | 41/111 [00:27<00:47, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9233, LAS: 0.8630, UEM: 0.5048, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.7383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8181, loss: 0.9055, batch_reg_loss: 0.1098, reg_loss: 0.1094 ||: 41%|#### | 45/111 [00:29<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9229, LAS: 0.8620, UEM: 0.4906, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1077, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2009, loss: 0.9135, batch_reg_loss: 0.1099, reg_loss: 0.1094 ||: 44%|####4 | 49/111 [00:32<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8291, UAS: 0.9227, LAS: 0.8618, UEM: 0.4889, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.1882, partial_loss/deprel_loss: 1.1634, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2784, loss: 0.9169, batch_reg_loss: 0.1100, reg_loss: 0.1095 ||: 48%|####7 | 53/111 [00:35<00:38, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9214, LAS: 0.8604, UEM: 0.5006, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1371, partial_loss/deprel_loss: 0.2988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.9293, batch_reg_loss: 0.1101, reg_loss: 0.1095 ||: 51%|#####1 | 57/111 [00:37<00:35, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9216, LAS: 0.8607, UEM: 0.4967, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3575, partial_loss/deprel_loss: 1.1842, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3291, loss: 0.9275, batch_reg_loss: 0.1102, reg_loss: 0.1095 ||: 55%|#####4 | 61/111 [00:40<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9224, LAS: 0.8614, UEM: 0.4990, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.6425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.9222, batch_reg_loss: 0.1103, reg_loss: 0.1096 ||: 59%|#####8 | 65/111 [00:43<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9221, LAS: 0.8608, UEM: 0.4882, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.7200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8027, loss: 0.9284, batch_reg_loss: 0.1104, reg_loss: 0.1096 ||: 62%|######2 | 69/111 [00:45<00:27, 1.51it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9217, LAS: 0.8602, UEM: 0.4867, LEM: 0.2522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4043, partial_loss/deprel_loss: 1.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4138, loss: 0.9343, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||: 66%|######5 | 73/111 [00:48<00:25, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9218, LAS: 0.8604, UEM: 0.4876, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1732, partial_loss/deprel_loss: 1.1097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2329, loss: 0.9349, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||: 68%|######8 | 76/111 [00:50<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9204, LAS: 0.8589, UEM: 0.4799, LEM: 0.2490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3397, partial_loss/deprel_loss: 1.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7552, loss: 0.9468, batch_reg_loss: 0.1106, reg_loss: 0.1098 ||: 72%|#######2 | 80/111 [00:53<00:20, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9212, LAS: 0.8595, UEM: 0.4774, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4129, partial_loss/deprel_loss: 0.5541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.9420, batch_reg_loss: 0.1107, reg_loss: 0.1098 ||: 76%|#######5 | 84/111 [00:55<00:17, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9211, LAS: 0.8593, UEM: 0.4725, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.4724, partial_loss/deprel_loss: 0.6431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7198, loss: 0.9422, batch_reg_loss: 0.1108, reg_loss: 0.1098 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9214, LAS: 0.8598, UEM: 0.4746, LEM: 0.2414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.5323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6088, loss: 0.9386, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||: 83%|########2 | 92/111 [01:00<00:12, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9217, LAS: 0.8601, UEM: 0.4750, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2847, partial_loss/deprel_loss: 0.5046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9359, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||: 86%|########6 | 96/111 [01:03<00:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9220, LAS: 0.8605, UEM: 0.4788, LEM: 0.2450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.9335, batch_reg_loss: 0.1110, reg_loss: 0.1100 ||: 90%|######### | 100/111 [01:05<00:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9226, LAS: 0.8612, UEM: 0.4877, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.4301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.9288, batch_reg_loss: 0.1111, reg_loss: 0.1100 ||: 94%|#########3| 104/111 [01:08<00:04, 1.52it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9225, LAS: 0.8610, UEM: 0.4866, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6775, partial_loss/deprel_loss: 0.9319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9303, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 97%|#########7| 108/111 [01:11<00:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - 
combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.210 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.067 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - reg_loss | 0.110 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UEM | 0.507 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LAS | 0.862 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - loss | 0.920 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEM | 0.275 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UAS | 0.924 | N/A\n", + "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - EM | 0.949 | N/A\n", + "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Epoch duration: 0:01:14.089580\n", + "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Estimated training time remaining: 8:09:46\n", + "2023-04-06 23:26:39,192 - INFO - allennlp.training.trainer - Epoch 28/399\n", + "2023-04-06 23:26:39,193 - INFO - 
allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:26:39,193 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:26:39,200 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9165, LAS: 0.8582, UEM: 0.6021, LEM: 0.3938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.9632, batch_reg_loss: 0.1113, reg_loss: 0.1113 ||: 3%|2 | 3/111 [00:02<01:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9296, LAS: 0.8705, UEM: 0.5821, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8214, partial_loss/deprel_loss: 1.0063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0807, loss: 0.8797, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||: 5%|5 | 6/111 [00:04<01:16, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9309, LAS: 0.8722, UEM: 0.5280, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.8538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.8659, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||: 8%|8 | 9/111 [00:06<01:14, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9298, LAS: 0.8711, UEM: 0.5151, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.5566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.8682, 
batch_reg_loss: 0.1115, reg_loss: 0.1114 ||: 12%|#1 | 13/111 [00:09<01:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9341, LAS: 0.8772, UEM: 0.6051, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0950, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2843, loss: 0.8222, batch_reg_loss: 0.1115, reg_loss: 0.1114 ||: 14%|#4 | 16/111 [00:11<01:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9353, LAS: 0.8781, UEM: 0.5912, LEM: 0.3662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3400, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.8082, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||: 17%|#7 | 19/111 [00:13<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9338, LAS: 0.8764, UEM: 0.5584, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.8871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9944, loss: 0.8188, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||: 21%|## | 23/111 [00:16<01:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9357, LAS: 0.8784, UEM: 0.5772, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.4073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.7985, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||: 23%|##3 | 26/111 [00:18<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9333, LAS: 0.8759, UEM: 0.5707, LEM: 
0.3427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0747, partial_loss/deprel_loss: 0.9027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0489, loss: 0.8142, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||: 26%|##6 | 29/111 [00:20<00:58, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8281, UAS: 0.9316, LAS: 0.8740, UEM: 0.5647, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2179, partial_loss/deprel_loss: 1.0295, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1790, loss: 0.8310, batch_reg_loss: 0.1118, reg_loss: 0.1116 ||: 29%|##8 | 32/111 [00:22<00:58, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9268, LAS: 0.8688, UEM: 0.5456, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0683, partial_loss/deprel_loss: 0.9735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1044, loss: 0.8689, batch_reg_loss: 0.1119, reg_loss: 0.1116 ||: 32%|###1 | 35/111 [00:25<00:56, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9256, LAS: 0.8672, UEM: 0.5327, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6623, loss: 0.8821, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||: 35%|###5 | 39/111 [00:27<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9262, LAS: 0.8679, UEM: 0.5237, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4640, partial_loss/deprel_loss: 0.6099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6928, loss: 0.8753, batch_reg_loss: 0.1121, reg_loss: 0.1117 
||: 39%|###8 | 43/111 [00:30<00:46, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9260, LAS: 0.8675, UEM: 0.5286, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5349, partial_loss/deprel_loss: 0.5833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6858, loss: 0.8760, batch_reg_loss: 0.1122, reg_loss: 0.1117 ||: 42%|####2 | 47/111 [00:32<00:42, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9248, LAS: 0.8660, UEM: 0.5233, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2239, partial_loss/deprel_loss: 1.0366, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1863, loss: 0.8865, batch_reg_loss: 0.1123, reg_loss: 0.1117 ||: 46%|####5 | 51/111 [00:35<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9241, LAS: 0.8651, UEM: 0.5362, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4257, partial_loss/deprel_loss: 0.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7030, loss: 0.8954, batch_reg_loss: 0.1123, reg_loss: 0.1118 ||: 49%|####8 | 54/111 [00:37<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9245, LAS: 0.8652, UEM: 0.5354, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.8952, batch_reg_loss: 0.1124, reg_loss: 0.1118 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9239, LAS: 0.8643, UEM: 0.5229, LEM: 0.2924, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0378, partial_loss/deprel_loss: 1.0526, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1621, loss: 0.9046, batch_reg_loss: 0.1125, reg_loss: 0.1118 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9243, LAS: 0.8646, UEM: 0.5144, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8400, partial_loss/deprel_loss: 0.8978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9988, loss: 0.9017, batch_reg_loss: 0.1125, reg_loss: 0.1119 ||: 58%|#####7 | 64/111 [00:44<00:31, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9241, LAS: 0.8643, UEM: 0.5133, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6003, loss: 0.9049, batch_reg_loss: 0.1126, reg_loss: 0.1119 ||: 61%|######1 | 68/111 [00:47<00:29, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9236, LAS: 0.8637, UEM: 0.5139, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.9107, batch_reg_loss: 0.1127, reg_loss: 0.1120 ||: 64%|######3 | 71/111 [00:49<00:27, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9230, LAS: 0.8629, UEM: 0.5046, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1078, partial_loss/deprel_loss: 1.0005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1347, 
loss: 0.9176, batch_reg_loss: 0.1128, reg_loss: 0.1120 ||: 68%|######7 | 75/111 [00:51<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9228, LAS: 0.8627, UEM: 0.5046, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3583, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.9189, batch_reg_loss: 0.1129, reg_loss: 0.1120 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9231, LAS: 0.8629, UEM: 0.4983, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7399, partial_loss/deprel_loss: 0.8801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9650, loss: 0.9165, batch_reg_loss: 0.1130, reg_loss: 0.1121 ||: 75%|#######4 | 83/111 [00:56<00:17, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9215, LAS: 0.8608, UEM: 0.4888, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.8282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.9335, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||: 78%|#######8 | 87/111 [00:59<00:15, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9220, LAS: 0.8617, UEM: 0.4992, LEM: 0.2722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3817, partial_loss/deprel_loss: 0.4937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5845, loss: 0.9263, batch_reg_loss: 0.1131, reg_loss: 0.1122 ||: 82%|########1 | 91/111 [01:02<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, 
UAS: 0.9226, LAS: 0.8625, UEM: 0.5122, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.7480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8618, loss: 0.9195, batch_reg_loss: 0.1132, reg_loss: 0.1122 ||: 86%|########5 | 95/111 [01:04<00:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9221, LAS: 0.8619, UEM: 0.5084, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7713, loss: 0.9258, batch_reg_loss: 0.1133, reg_loss: 0.1122 ||: 88%|########8 | 98/111 [01:07<00:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9228, LAS: 0.8628, UEM: 0.5095, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4700, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7098, loss: 0.9194, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||: 91%|######### | 101/111 [01:09<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9230, LAS: 0.8630, UEM: 0.5087, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.6215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.9173, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||: 94%|#########3| 104/111 [01:11<00:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9233, LAS: 0.8633, UEM: 0.5091, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.7718, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.8647, loss: 0.9148, batch_reg_loss: 0.1135, reg_loss: 0.1123 ||: 96%|#########6| 107/111 [01:13<00:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - 
partial_loss/deprel_loss | 1.055 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.150 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - reg_loss | 0.112 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UEM | 0.506 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - LAS | 0.863 | N/A\n", + "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - loss | 0.920 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEM | 0.277 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - UAS | 0.923 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EM | 0.829 | N/A\n", + "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Epoch duration: 0:01:16.367015\n", + "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Estimated training time remaining: 8:07:53\n", + "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Epoch 29/399\n", + "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:27:55,567 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9484, LAS: 0.8952, UEM: 0.6497, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.6486, batch_reg_loss: 0.1136, reg_loss: 0.1136 ||: 3%|2 | 3/111 [00:02<01:22, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9318, LAS: 0.8774, UEM: 0.5448, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 1.0995, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2447, loss: 0.8080, batch_reg_loss: 0.1137, reg_loss: 0.1136 ||: 5%|5 | 6/111 [00:04<01:20, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9304, LAS: 0.8744, UEM: 0.4970, LEM: 0.2492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9037, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.8255, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||: 8%|8 | 9/111 [00:06<01:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9234, LAS: 0.8670, UEM: 0.5124, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1069, partial_loss/deprel_loss: 1.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.8843, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||: 11%|# | 12/111 [00:09<01:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9279, LAS: 0.8722, UEM: 0.5277, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5707, 
partial_loss/deprel_loss: 0.5580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.8422, batch_reg_loss: 0.1139, reg_loss: 0.1137 ||: 14%|#3 | 15/111 [00:11<01:10, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9297, LAS: 0.8731, UEM: 0.5152, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8735, partial_loss/deprel_loss: 0.9656, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0611, loss: 0.8408, batch_reg_loss: 0.1139, reg_loss: 0.1138 ||: 16%|#6 | 18/111 [00:13<01:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9254, LAS: 0.8680, UEM: 0.4779, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 0.9413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.8777, batch_reg_loss: 0.1140, reg_loss: 0.1138 ||: 20%|#9 | 22/111 [00:15<01:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9271, LAS: 0.8695, UEM: 0.4928, LEM: 0.2473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.8677, batch_reg_loss: 0.1141, reg_loss: 0.1138 ||: 23%|##3 | 26/111 [00:18<00:56, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9297, LAS: 0.8723, UEM: 0.5254, LEM: 0.2732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.8417, batch_reg_loss: 0.1142, reg_loss: 0.1139 ||: 26%|##6 | 29/111 [00:20<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9264, LAS: 0.8679, UEM: 0.4938, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9940, partial_loss/deprel_loss: 0.9541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8794, batch_reg_loss: 0.1143, reg_loss: 0.1139 ||: 30%|##9 | 33/111 [00:22<00:52, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9259, LAS: 0.8670, UEM: 0.4878, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6497, loss: 0.8870, batch_reg_loss: 0.1143, reg_loss: 0.1140 ||: 32%|###2 | 36/111 [00:25<00:51, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9254, LAS: 0.8666, UEM: 0.4828, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2760, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1758, loss: 0.8918, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||: 35%|###5 | 39/111 [00:27<00:50, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9239, LAS: 0.8647, UEM: 0.4670, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2418, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1581, loss: 0.9075, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||: 38%|###7 | 42/111 [00:29<00:48, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9235, LAS: 0.8640, UEM: 0.4682, LEM: 0.2383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.5971, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9136, batch_reg_loss: 0.1145, reg_loss: 0.1140 ||: 41%|#### | 45/111 [00:31<00:47, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9244, LAS: 0.8653, UEM: 0.4755, LEM: 0.2426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0601, partial_loss/deprel_loss: 1.0311, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1515, loss: 0.9071, batch_reg_loss: 0.1146, reg_loss: 0.1141 ||: 43%|####3 | 48/111 [00:34<00:48, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9235, LAS: 0.8643, UEM: 0.4635, LEM: 0.2325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5594, partial_loss/deprel_loss: 1.1760, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 0.9154, batch_reg_loss: 0.1147, reg_loss: 0.1141 ||: 47%|####6 | 52/111 [00:36<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8303, UAS: 0.9236, LAS: 0.8641, UEM: 0.4612, LEM: 0.2281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1919, partial_loss/deprel_loss: 1.0681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2076, loss: 0.9156, batch_reg_loss: 0.1147, reg_loss: 0.1142 ||: 50%|####9 | 55/111 [00:38<00:40, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9229, LAS: 0.8635, UEM: 0.4512, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7935, partial_loss/deprel_loss: 0.7807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8981, loss: 0.9207, batch_reg_loss: 0.1148, reg_loss: 0.1142 ||: 53%|#####3 | 59/111 [00:41<00:36, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9232, LAS: 0.8639, UEM: 0.4533, LEM: 0.2245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7478, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9175, batch_reg_loss: 0.1149, reg_loss: 0.1142 ||: 57%|#####6 | 63/111 [00:44<00:32, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9243, LAS: 0.8649, UEM: 0.4697, LEM: 0.2379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.9061, batch_reg_loss: 0.1150, reg_loss: 0.1143 ||: 60%|###### | 67/111 [00:46<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9244, LAS: 0.8650, UEM: 0.4710, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3257, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5574, loss: 0.9044, batch_reg_loss: 0.1151, reg_loss: 0.1143 ||: 64%|######3 | 71/111 [00:49<00:26, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9256, LAS: 0.8662, UEM: 0.4812, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5280, loss: 0.8951, batch_reg_loss: 0.1151, reg_loss: 0.1144 ||: 68%|######7 | 75/111 [00:52<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9258, LAS: 0.8662, UEM: 0.4778, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.0733, partial_loss/deprel_loss: 1.0164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1430, loss: 0.8939, batch_reg_loss: 0.1152, reg_loss: 0.1144 ||: 71%|#######1 | 79/111 [00:54<00:20, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9250, LAS: 0.8653, UEM: 0.4695, LEM: 0.2337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8547, loss: 0.9007, batch_reg_loss: 0.1153, reg_loss: 0.1144 ||: 75%|#######4 | 83/111 [00:57<00:18, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9255, LAS: 0.8657, UEM: 0.4783, LEM: 0.2420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0986, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1513, loss: 0.8969, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||: 78%|#######8 | 87/111 [00:59<00:15, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9263, LAS: 0.8668, UEM: 0.4890, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6777, partial_loss/deprel_loss: 0.7179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8253, loss: 0.8871, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||: 82%|########1 | 91/111 [01:02<00:13, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7511, UAS: 0.9233, LAS: 0.8634, UEM: 0.4815, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6230, partial_loss/deprel_loss: 1.7261, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0210, loss: 0.9162, batch_reg_loss: 0.1155, reg_loss: 0.1146 ||: 86%|########5 | 95/111 [01:05<00:10, 
1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8200, UAS: 0.9234, LAS: 0.8636, UEM: 0.4813, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2783, partial_loss/deprel_loss: 1.1654, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3036, loss: 0.9147, batch_reg_loss: 0.1156, reg_loss: 0.1146 ||: 89%|########9 | 99/111 [01:07<00:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7740, UAS: 0.9232, LAS: 0.8632, UEM: 0.4859, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9147, partial_loss/deprel_loss: 1.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6113, loss: 0.9170, batch_reg_loss: 0.1157, reg_loss: 0.1146 ||: 93%|#########2| 103/111 [01:10<00:05, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9242, LAS: 0.8645, UEM: 0.5148, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0692, partial_loss/deprel_loss: 0.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2916, loss: 0.9075, batch_reg_loss: 0.1158, reg_loss: 0.1147 ||: 95%|#########5| 106/111 [01:14<00:04, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9248, LAS: 0.8652, UEM: 0.5157, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5760, loss: 0.9015, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||: 99%|#########9| 110/111 [01:17<00:00, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7932, UAS: 0.9241, LAS: 0.8645, UEM: 0.5140, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8952, partial_loss/deprel_loss: 1.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5700, loss: 0.9075, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.344 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.895 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - reg_loss | 0.115 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UEM | 0.514 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LAS | 0.865 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - loss | 0.908 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LEM | 0.282 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UAS | 0.924 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EM | 0.793 | N/A\n", + "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Epoch duration: 0:01:17.829257\n", + "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:21\n", + "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Epoch 30/399\n", + "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:29:13,390 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:29:13,396 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9423, LAS: 0.8831, UEM: 0.5266, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8957, partial_loss/deprel_loss: 0.8831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0016, loss: 0.7764, batch_reg_loss: 0.1160, reg_loss: 0.1159 ||: 4%|3 | 4/111 [00:02<01:10, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9297, LAS: 0.8704, UEM: 0.4777, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4410, partial_loss/deprel_loss: 1.0704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2605, loss: 
0.8706, batch_reg_loss: 0.1160, reg_loss: 0.1160 ||: 6%|6 | 7/111 [00:04<01:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7884, UAS: 0.9209, LAS: 0.8615, UEM: 0.4229, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9655, partial_loss/deprel_loss: 1.3005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5497, loss: 0.9493, batch_reg_loss: 0.1161, reg_loss: 0.1160 ||: 10%|9 | 11/111 [00:07<01:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9205, LAS: 0.8604, UEM: 0.4367, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3561, partial_loss/deprel_loss: 0.5195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.9509, batch_reg_loss: 0.1162, reg_loss: 0.1160 ||: 13%|#2 | 14/111 [00:09<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9244, LAS: 0.8644, UEM: 0.4492, LEM: 0.2016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4715, partial_loss/deprel_loss: 0.6246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.9135, batch_reg_loss: 0.1162, reg_loss: 0.1161 ||: 15%|#5 | 17/111 [00:11<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9269, LAS: 0.8684, UEM: 0.4862, LEM: 0.2381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1172, partial_loss/deprel_loss: 0.9006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0602, loss: 0.8846, batch_reg_loss: 0.1163, reg_loss: 0.1161 ||: 18%|#8 | 20/111 [00:13<01:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9247, LAS: 0.8656, UEM: 0.4565, 
LEM: 0.2166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6565, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9340, loss: 0.9051, batch_reg_loss: 0.1164, reg_loss: 0.1161 ||: 22%|##1 | 24/111 [00:16<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7923, UAS: 0.9189, LAS: 0.8592, UEM: 0.4360, LEM: 0.2045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9101, partial_loss/deprel_loss: 1.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5238, loss: 0.9555, batch_reg_loss: 0.1164, reg_loss: 0.1162 ||: 24%|##4 | 27/111 [00:18<00:57, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8100, UAS: 0.9204, LAS: 0.8606, UEM: 0.4805, LEM: 0.2478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4343, partial_loss/deprel_loss: 1.1992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3628, loss: 0.9425, batch_reg_loss: 0.1165, reg_loss: 0.1162 ||: 27%|##7 | 30/111 [00:20<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9195, LAS: 0.8595, UEM: 0.4778, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3692, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6280, loss: 0.9496, batch_reg_loss: 0.1166, reg_loss: 0.1162 ||: 31%|### | 34/111 [00:23<00:54, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8410, UAS: 0.9186, LAS: 0.8582, UEM: 0.4590, LEM: 0.2313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0912, partial_loss/deprel_loss: 0.9415, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0881, loss: 0.9539, batch_reg_loss: 0.1167, reg_loss: 
0.1163 ||: 34%|###4 | 38/111 [00:26<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9205, LAS: 0.8606, UEM: 0.4768, LEM: 0.2436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5354, loss: 0.9355, batch_reg_loss: 0.1168, reg_loss: 0.1163 ||: 38%|###7 | 42/111 [00:28<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7559, UAS: 0.9180, LAS: 0.8576, UEM: 0.4588, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5943, partial_loss/deprel_loss: 1.6157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9283, loss: 0.9636, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||: 41%|####1 | 46/111 [00:31<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9180, LAS: 0.8578, UEM: 0.4674, LEM: 0.2415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.1822, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9619, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||: 44%|####4 | 49/111 [00:33<00:44, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9181, LAS: 0.8578, UEM: 0.4559, LEM: 0.2312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2104, loss: 0.9637, batch_reg_loss: 0.1170, reg_loss: 0.1165 ||: 48%|####7 | 53/111 [00:36<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9192, LAS: 0.8589, UEM: 0.4595, LEM: 0.2339, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 1.0027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.9569, batch_reg_loss: 0.1171, reg_loss: 0.1165 ||: 51%|#####1 | 57/111 [00:39<00:36, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9202, LAS: 0.8601, UEM: 0.4839, LEM: 0.2551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.9449, batch_reg_loss: 0.1172, reg_loss: 0.1165 ||: 55%|#####4 | 61/111 [00:41<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9211, LAS: 0.8613, UEM: 0.4880, LEM: 0.2559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6812, partial_loss/deprel_loss: 0.7970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8911, loss: 0.9362, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9211, LAS: 0.8612, UEM: 0.4893, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.8934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 0.9348, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||: 60%|###### | 67/111 [00:46<00:31, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9214, LAS: 0.8614, UEM: 0.4829, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.6596, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.7614, loss: 0.9320, batch_reg_loss: 0.1174, reg_loss: 0.1166 ||: 63%|######3 | 70/111 [00:48<00:28, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9210, LAS: 0.8611, UEM: 0.4750, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3160, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2391, loss: 0.9346, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||: 67%|######6 | 74/111 [00:50<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9217, LAS: 0.8620, UEM: 0.4883, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1238, partial_loss/deprel_loss: 0.2637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3533, loss: 0.9277, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||: 69%|######9 | 77/111 [00:52<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9227, LAS: 0.8631, UEM: 0.4886, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.9184, batch_reg_loss: 0.1176, reg_loss: 0.1168 ||: 73%|#######2 | 81/111 [00:55<00:19, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9236, LAS: 0.8643, UEM: 0.4999, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.9100, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||: 77%|#######6 | 85/111 [00:58<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9548, UAS: 0.9248, LAS: 0.8659, UEM: 0.5212, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.1867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2816, loss: 0.8990, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||: 79%|#######9 | 88/111 [01:00<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9253, LAS: 0.8663, UEM: 0.5287, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3533, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6751, loss: 0.8959, batch_reg_loss: 0.1178, reg_loss: 0.1169 ||: 82%|########1 | 91/111 [01:02<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9255, LAS: 0.8665, UEM: 0.5249, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8944, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||: 86%|########5 | 95/111 [01:05<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9255, LAS: 0.8662, UEM: 0.5190, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.7722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8451, loss: 0.8972, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||: 89%|########9 | 99/111 [01:07<00:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9260, LAS: 0.8667, UEM: 0.5188, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5216, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7390, loss: 0.8915, batch_reg_loss: 0.1180, reg_loss: 0.1170 ||: 93%|#########2| 103/111 [01:10<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9252, LAS: 0.8656, UEM: 0.5142, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5122, partial_loss/deprel_loss: 0.7142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7919, loss: 0.9013, batch_reg_loss: 0.1181, reg_loss: 0.1170 ||: 95%|#########5| 106/111 [01:12<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8074, UAS: 0.9252, LAS: 0.8657, UEM: 0.5133, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5927, partial_loss/deprel_loss: 1.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4642, loss: 0.9032, batch_reg_loss: 0.1181, reg_loss: 0.1171 ||: 99%|#########9| 110/111 [01:15<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7988, UAS: 0.9247, LAS: 0.8651, UEM: 0.5116, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6141, partial_loss/deprel_loss: 1.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4702, loss: 0.9083, batch_reg_loss: 0.1182, reg_loss: 0.1171 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:30:29,126 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8614, UAS: 0.9506, LAS: 0.8947, UEM: 0.6800, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0408, partial_loss/deprel_loss: 44.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 35.5832, loss: 24.8075, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 
3/13 [00:02<00:09, 1.09it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9518, LAS: 0.8976, UEM: 0.6637, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 17.7429, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2723, loss: 22.5560, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9389, LAS: 0.8836, UEM: 0.6104, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9587, partial_loss/deprel_loss: 37.7004, partial_loss/cycle_loss: 0.0000, batch_loss: 30.3521, loss: 26.7216, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8765, UAS: 0.9361, LAS: 0.8796, UEM: 0.5538, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6483, partial_loss/deprel_loss: 35.0183, partial_loss/cycle_loss: 0.0000, batch_loss: 28.1443, loss: 27.8730, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9399, LAS: 0.8846, UEM: 0.6236, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 20.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3867, loss: 26.3771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.06it/s]\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELEM | 
0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.286 | 20.438\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.614 | 0.180\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - reg_loss | 0.117 | 0.000\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UEM | 0.512 | 0.624\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LAS | 0.865 | 0.885\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - loss | 0.908 | 26.377\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEM | 0.282 | 0.353\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UAS | 0.925 | 0.940\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:30:41,443 - INFO - 
combo.training.tensorboard_writer - EM | 0.799 | 0.937\n", + "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Epoch duration: 0:01:28.054718\n", + "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:52\n", + "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Epoch 31/399\n", + "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:30:41,445 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:30:41,452 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9334, LAS: 0.8786, UEM: 0.4443, LEM: 0.1990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7236, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8045, batch_reg_loss: 0.1182, reg_loss: 0.1182 ||: 4%|3 | 4/111 [00:02<01:04, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9250, LAS: 0.8677, UEM: 0.5060, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1941, partial_loss/deprel_loss: 1.0869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2266, loss: 0.8819, batch_reg_loss: 0.1183, reg_loss: 0.1182 ||: 6%|6 | 7/111 [00:04<01:04, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9246, LAS: 0.8647, UEM: 0.5259, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5980, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.9099, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||: 9%|9 | 10/111 [00:06<01:06, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9163, LAS: 0.8569, UEM: 0.4684, LEM: 0.2328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7216, partial_loss/deprel_loss: 1.2022, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4245, loss: 0.9877, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||: 12%|#1 | 13/111 [00:08<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9163, LAS: 0.8573, UEM: 0.4320, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4364, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7002, loss: 0.9823, batch_reg_loss: 0.1185, reg_loss: 0.1183 ||: 15%|#5 | 17/111 [00:11<01:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9213, LAS: 0.8638, UEM: 0.5339, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0738, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2866, loss: 0.9381, batch_reg_loss: 0.1186, reg_loss: 0.1184 ||: 19%|#8 | 21/111 [00:13<00:59, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7860, UAS: 0.9181, LAS: 0.8604, UEM: 0.5074, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8301, partial_loss/deprel_loss: 1.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 0.9604, batch_reg_loss: 0.1187, reg_loss: 0.1184 ||: 22%|##1 | 24/111 [00:16<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8936, UAS: 0.9206, LAS: 0.8625, UEM: 0.5125, LEM: 0.3077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.9412, batch_reg_loss: 0.1188, reg_loss: 0.1185 ||: 25%|##5 | 28/111 [00:18<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9232, LAS: 0.8654, UEM: 0.5107, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.6426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7371, loss: 0.9181, batch_reg_loss: 0.1189, reg_loss: 0.1185 ||: 29%|##8 | 32/111 [00:21<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9209, LAS: 0.8630, UEM: 0.5014, LEM: 0.2881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6350, partial_loss/deprel_loss: 0.7174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9377, batch_reg_loss: 0.1189, reg_loss: 0.1186 ||: 32%|###2 | 36/111 [00:23<00:49, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9208, LAS: 0.8625, UEM: 0.4858, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7292, partial_loss/deprel_loss: 0.8410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9377, loss: 0.9367, batch_reg_loss: 0.1190, reg_loss: 0.1186 ||: 36%|###6 | 40/111 [00:26<00:45, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9211, LAS: 0.8619, UEM: 0.4705, LEM: 0.2575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7919, partial_loss/deprel_loss: 0.9952, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.0737, loss: 0.9432, batch_reg_loss: 0.1191, reg_loss: 0.1186 ||: 40%|###9 | 44/111 [00:28<00:41, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9221, LAS: 0.8633, UEM: 0.4997, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0615, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1421, loss: 0.9287, batch_reg_loss: 0.1192, reg_loss: 0.1187 ||: 43%|####3 | 48/111 [00:31<00:41, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9231, LAS: 0.8644, UEM: 0.5092, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0852, partial_loss/deprel_loss: 1.0912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2093, loss: 0.9185, batch_reg_loss: 0.1193, reg_loss: 0.1187 ||: 47%|####6 | 52/111 [00:34<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7887, UAS: 0.9225, LAS: 0.8640, UEM: 0.5098, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1006, partial_loss/deprel_loss: 1.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5885, loss: 0.9214, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||: 50%|####9 | 55/111 [00:37<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9226, LAS: 0.8640, UEM: 0.5125, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3773, partial_loss/deprel_loss: 0.6483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7135, loss: 0.9201, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||: 52%|#####2 | 58/111 [00:39<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8890, UAS: 0.9233, LAS: 0.8648, UEM: 0.5058, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7419, loss: 0.9154, batch_reg_loss: 0.1195, reg_loss: 0.1188 ||: 56%|#####5 | 62/111 [00:41<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9228, LAS: 0.8639, UEM: 0.4991, LEM: 0.2779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.9395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0740, loss: 0.9225, batch_reg_loss: 0.1196, reg_loss: 0.1189 ||: 59%|#####9 | 66/111 [00:44<00:29, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9241, LAS: 0.8651, UEM: 0.5039, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4332, partial_loss/deprel_loss: 0.6507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.9121, batch_reg_loss: 0.1197, reg_loss: 0.1189 ||: 63%|######3 | 70/111 [00:46<00:26, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9232, LAS: 0.8641, UEM: 0.4970, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1236, loss: 0.9186, batch_reg_loss: 0.1197, reg_loss: 0.1190 ||: 67%|######6 | 74/111 [00:49<00:23, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9234, LAS: 0.8646, UEM: 0.4956, LEM: 0.2692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3508, 
partial_loss/deprel_loss: 0.4847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.9129, batch_reg_loss: 0.1198, reg_loss: 0.1190 ||: 70%|####### | 78/111 [00:51<00:21, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9245, LAS: 0.8657, UEM: 0.4978, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6454, partial_loss/deprel_loss: 0.8686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9439, loss: 0.9062, batch_reg_loss: 0.1199, reg_loss: 0.1191 ||: 74%|#######3 | 82/111 [00:54<00:18, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9247, LAS: 0.8661, UEM: 0.5063, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.8663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.9016, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||: 77%|#######7 | 86/111 [00:57<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9252, LAS: 0.8666, UEM: 0.5083, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.8977, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||: 80%|######## | 89/111 [00:59<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8134, UAS: 0.9248, LAS: 0.8661, UEM: 0.5076, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3499, partial_loss/deprel_loss: 1.1000, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2701, loss: 0.9023, batch_reg_loss: 0.1201, reg_loss: 0.1192 ||: 83%|########2 | 92/111 [01:01<00:13, 1.39it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9230, LAS: 0.8643, UEM: 0.4989, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.9014, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0436, loss: 0.9173, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||: 86%|########6 | 96/111 [01:04<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9233, LAS: 0.8645, UEM: 0.4989, LEM: 0.2735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2969, partial_loss/deprel_loss: 0.4878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.9146, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||: 89%|########9 | 99/111 [01:06<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9238, LAS: 0.8649, UEM: 0.5049, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8979, partial_loss/deprel_loss: 0.9199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0358, loss: 0.9114, batch_reg_loss: 0.1203, reg_loss: 0.1193 ||: 92%|#########1| 102/111 [01:08<00:06, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9244, LAS: 0.8655, UEM: 0.5149, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1225, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1554, loss: 0.9060, batch_reg_loss: 0.1204, reg_loss: 0.1193 ||: 95%|#########4| 105/111 [01:10<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9240, LAS: 0.8650, UEM: 0.5085, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.9104, batch_reg_loss: 0.1205, reg_loss: 0.1193 ||: 98%|#########8| 109/111 [01:13<00:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9245, LAS: 0.8656, UEM: 0.5131, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7048, loss: 0.9049, batch_reg_loss: 0.1205, reg_loss: 0.1194 ||: 100%|##########| 111/111 [01:14<00:00, 1.48it/s]\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.609 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.485 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - reg_loss | 0.119 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UEM | 0.513 | N/A\n", + 
"2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LAS | 0.866 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - loss | 0.905 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEM | 0.283 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UAS | 0.925 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EM | 0.891 | N/A\n", + "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Epoch duration: 0:01:14.783878\n", + "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Estimated training time remaining: 8:04:42\n", + "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Epoch 32/399\n", + "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:31:56,229 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:31:56,236 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9280, LAS: 0.8652, UEM: 0.3878, LEM: 0.1763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0858, partial_loss/deprel_loss: 1.0690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1930, loss: 0.9121, 
batch_reg_loss: 0.1206, reg_loss: 0.1205 ||: 4%|3 | 4/111 [00:02<01:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9222, LAS: 0.8593, UEM: 0.3942, LEM: 0.1663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.7455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9508, batch_reg_loss: 0.1206, reg_loss: 0.1206 ||: 6%|6 | 7/111 [00:04<01:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9268, LAS: 0.8661, UEM: 0.4804, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.8993, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||: 9%|9 | 10/111 [00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9294, LAS: 0.8701, UEM: 0.4779, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9712, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0567, loss: 0.8729, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||: 12%|#1 | 13/111 [00:08<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9245, LAS: 0.8648, UEM: 0.4336, LEM: 0.2022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7990, partial_loss/deprel_loss: 0.7857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.9191, batch_reg_loss: 0.1208, reg_loss: 0.1207 ||: 14%|#4 | 16/111 [00:11<01:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9268, LAS: 0.8677, UEM: 0.5322, LEM: 0.3289, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0926, partial_loss/deprel_loss: 0.2178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3136, loss: 0.8968, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||: 17%|#7 | 19/111 [00:13<01:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9291, LAS: 0.8698, UEM: 0.5301, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5335, partial_loss/deprel_loss: 0.6623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.8739, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||: 20%|#9 | 22/111 [00:15<01:06, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9269, LAS: 0.8675, UEM: 0.5307, LEM: 0.3049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3634, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.8880, batch_reg_loss: 0.1210, reg_loss: 0.1207 ||: 23%|##2 | 25/111 [00:18<01:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9255, LAS: 0.8662, UEM: 0.5171, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1714, partial_loss/deprel_loss: 1.0061, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1602, loss: 0.9002, batch_reg_loss: 0.1210, reg_loss: 0.1208 ||: 25%|##5 | 28/111 [00:20<01:03, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9248, LAS: 0.8655, UEM: 0.5165, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.4554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.9082, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||: 28%|##7 
| 31/111 [00:22<01:01, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9272, LAS: 0.8687, UEM: 0.5406, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4217, loss: 0.8810, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||: 31%|### | 34/111 [00:25<00:59, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9299, LAS: 0.8714, UEM: 0.5655, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4713, loss: 0.8544, batch_reg_loss: 0.1212, reg_loss: 0.1209 ||: 34%|###4 | 38/111 [00:27<00:54, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9285, LAS: 0.8704, UEM: 0.5675, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1536, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5566, loss: 0.8616, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||: 37%|###6 | 41/111 [00:30<00:53, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9300, LAS: 0.8721, UEM: 0.5725, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3764, partial_loss/deprel_loss: 0.4992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.8479, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||: 40%|###9 | 44/111 [00:32<00:50, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9297, LAS: 0.8715, UEM: 0.5590, LEM: 0.3199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.8563, batch_reg_loss: 0.1214, reg_loss: 0.1210 ||: 43%|####3 | 48/111 [00:35<00:46, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9309, LAS: 0.8732, UEM: 0.5558, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4737, partial_loss/deprel_loss: 0.6535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.8460, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||: 47%|####6 | 52/111 [00:37<00:41, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9302, LAS: 0.8723, UEM: 0.5439, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6993, partial_loss/deprel_loss: 0.7695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8770, loss: 0.8525, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||: 50%|##### | 56/111 [00:40<00:37, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.9306, LAS: 0.8729, UEM: 0.5460, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0724, partial_loss/deprel_loss: 1.0548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1799, loss: 0.8494, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||: 53%|#####3 | 59/111 [00:42<00:37, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9290, LAS: 0.8712, UEM: 0.5358, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2836, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1690, loss: 0.8636, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||: 56%|#####5 | 62/111 
[00:44<00:34, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9293, LAS: 0.8715, UEM: 0.5296, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.7730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8775, loss: 0.8617, batch_reg_loss: 0.1217, reg_loss: 0.1211 ||: 59%|#####9 | 66/111 [00:47<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.9263, LAS: 0.8683, UEM: 0.5209, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4318, partial_loss/deprel_loss: 1.0938, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2831, loss: 0.8883, batch_reg_loss: 0.1218, reg_loss: 0.1211 ||: 62%|######2 | 69/111 [00:49<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9263, LAS: 0.8683, UEM: 0.5139, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8951, loss: 0.8890, batch_reg_loss: 0.1218, reg_loss: 0.1212 ||: 66%|######5 | 73/111 [00:51<00:24, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8262, UAS: 0.9260, LAS: 0.8681, UEM: 0.5085, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1389, partial_loss/deprel_loss: 1.0152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1619, loss: 0.8884, batch_reg_loss: 0.1219, reg_loss: 0.1212 ||: 69%|######9 | 77/111 [00:54<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9255, 
LAS: 0.8675, UEM: 0.5156, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3720, loss: 0.8924, batch_reg_loss: 0.1220, reg_loss: 0.1213 ||: 73%|#######2 | 81/111 [00:57<00:19, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9251, LAS: 0.8669, UEM: 0.5146, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3275, partial_loss/deprel_loss: 0.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.8963, batch_reg_loss: 0.1221, reg_loss: 0.1213 ||: 77%|#######6 | 85/111 [00:59<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9257, LAS: 0.8675, UEM: 0.5170, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8591, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 0.8924, batch_reg_loss: 0.1222, reg_loss: 0.1213 ||: 79%|#######9 | 88/111 [01:02<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9258, LAS: 0.8675, UEM: 0.5237, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1875, partial_loss/deprel_loss: 0.3560, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.8923, batch_reg_loss: 0.1222, reg_loss: 0.1214 ||: 82%|########1 | 91/111 [01:04<00:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9254, LAS: 0.8670, UEM: 0.5240, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, 
loss: 0.8989, batch_reg_loss: 0.1223, reg_loss: 0.1214 ||: 86%|########5 | 95/111 [01:07<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9248, LAS: 0.8662, UEM: 0.5177, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 0.8869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0248, loss: 0.9030, batch_reg_loss: 0.1224, reg_loss: 0.1214 ||: 88%|########8 | 98/111 [01:09<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9248, LAS: 0.8662, UEM: 0.5197, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.8229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9171, loss: 0.9023, batch_reg_loss: 0.1225, reg_loss: 0.1215 ||: 92%|#########1| 102/111 [01:11<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.9248, LAS: 0.8661, UEM: 0.5155, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9436, loss: 0.9038, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||: 95%|#########5| 106/111 [01:14<00:03, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9251, LAS: 0.8664, UEM: 0.5153, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7650, partial_loss/deprel_loss: 0.8273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9375, loss: 0.9013, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||: 99%|#########9| 110/111 [01:16<00:00, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8006, UAS: 0.9245, LAS: 0.8658, UEM: 0.5134, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5343, partial_loss/deprel_loss: 1.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4532, loss: 0.9062, batch_reg_loss: 0.1227, reg_loss: 0.1215 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.280 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.534 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - reg_loss | 0.122 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UEM | 0.513 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LAS | 0.866 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - loss | 0.906 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - 
combo.training.tensorboard_writer - LEM | 0.284 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UAS | 0.925 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EM | 0.801 | N/A\n", + "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Epoch duration: 0:01:17.486642\n", + "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Estimated training time remaining: 8:03:06\n", + "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Epoch 33/399\n", + "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:33:13,716 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:33:13,722 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9211, LAS: 0.8634, UEM: 0.2448, LEM: 0.0606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2054, partial_loss/deprel_loss: 0.9809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1485, loss: 0.9179, batch_reg_loss: 0.1227, reg_loss: 0.1227 ||: 4%|3 | 4/111 [00:02<01:16, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9216, LAS: 0.8649, UEM: 0.4007, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8307, 
partial_loss/deprel_loss: 0.7976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9270, loss: 0.9128, batch_reg_loss: 0.1228, reg_loss: 0.1227 ||: 6%|6 | 7/111 [00:05<01:17, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9301, LAS: 0.8748, UEM: 0.4858, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5363, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6713, loss: 0.8323, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||: 9%|9 | 10/111 [00:07<01:16, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9291, LAS: 0.8730, UEM: 0.4607, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.7278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 0.8399, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||: 13%|#2 | 14/111 [00:10<01:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9238, LAS: 0.8661, UEM: 0.4238, LEM: 0.2058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1477, partial_loss/deprel_loss: 1.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1666, loss: 0.9019, batch_reg_loss: 0.1230, reg_loss: 0.1228 ||: 15%|#5 | 17/111 [00:12<01:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9265, LAS: 0.8681, UEM: 0.4492, LEM: 0.2182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.8846, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||: 18%|#8 | 20/111 [00:14<01:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9254, LAS: 0.8666, UEM: 0.4648, LEM: 0.2258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8170, partial_loss/deprel_loss: 1.3568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5720, loss: 0.8961, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||: 21%|## | 23/111 [00:16<01:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9235, LAS: 0.8644, UEM: 0.4432, LEM: 0.2090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1372, partial_loss/deprel_loss: 0.9852, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1388, loss: 0.9177, batch_reg_loss: 0.1232, reg_loss: 0.1229 ||: 24%|##4 | 27/111 [00:18<00:57, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9265, LAS: 0.8682, UEM: 0.4929, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.8827, batch_reg_loss: 0.1232, reg_loss: 0.1230 ||: 27%|##7 | 30/111 [00:21<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9256, LAS: 0.8672, UEM: 0.4734, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9334, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8918, batch_reg_loss: 0.1233, reg_loss: 0.1230 ||: 30%|##9 | 33/111 [00:23<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9268, LAS: 0.8684, UEM: 0.4827, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.7842, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8856, loss: 0.8809, batch_reg_loss: 0.1234, reg_loss: 0.1230 ||: 32%|###2 | 36/111 [00:25<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9268, LAS: 0.8687, UEM: 0.4928, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1770, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4536, loss: 0.8786, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||: 36%|###6 | 40/111 [00:27<00:47, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7844, UAS: 0.9267, LAS: 0.8682, UEM: 0.4953, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8813, partial_loss/deprel_loss: 1.3088, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5469, loss: 0.8836, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||: 40%|###9 | 44/111 [00:30<00:44, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9241, LAS: 0.8655, UEM: 0.4929, LEM: 0.2566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8672, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9084, batch_reg_loss: 0.1236, reg_loss: 0.1231 ||: 43%|####3 | 48/111 [00:33<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9233, LAS: 0.8647, UEM: 0.4857, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4534, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.9137, batch_reg_loss: 0.1237, reg_loss: 0.1232 ||: 47%|####6 | 52/111 [00:35<00:39, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9234, LAS: 0.8646, UEM: 0.4809, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.9135, batch_reg_loss: 0.1238, reg_loss: 0.1232 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9234, LAS: 0.8646, UEM: 0.5000, LEM: 0.2691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1320, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3734, loss: 0.9154, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9247, LAS: 0.8660, UEM: 0.5193, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2943, partial_loss/deprel_loss: 0.4989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.9023, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||: 57%|#####6 | 63/111 [00:44<00:37, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9245, LAS: 0.8655, UEM: 0.5094, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.9076, batch_reg_loss: 0.1240, reg_loss: 0.1233 ||: 60%|###### | 67/111 [00:47<00:32, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9238, LAS: 0.8647, UEM: 0.5004, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.0190, partial_loss/deprel_loss: 0.8973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0457, loss: 0.9132, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||: 63%|######3 | 70/111 [00:49<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9256, LAS: 0.8670, UEM: 0.5380, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7758, loss: 0.8967, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||: 66%|######5 | 73/111 [00:51<00:28, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9259, LAS: 0.8673, UEM: 0.5356, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4678, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6266, loss: 0.8944, batch_reg_loss: 0.1242, reg_loss: 0.1234 ||: 68%|######8 | 76/111 [00:53<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9264, LAS: 0.8678, UEM: 0.5363, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5585, partial_loss/deprel_loss: 0.7297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8197, loss: 0.8902, batch_reg_loss: 0.1242, reg_loss: 0.1235 ||: 71%|#######1 | 79/111 [00:56<00:24, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7776, UAS: 0.9260, LAS: 0.8674, UEM: 0.5386, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2130, partial_loss/deprel_loss: 1.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6674, loss: 0.8933, batch_reg_loss: 0.1243, reg_loss: 0.1235 ||: 74%|#######3 | 82/111 [00:58<00:22, 
1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9256, LAS: 0.8668, UEM: 0.5348, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7456, partial_loss/deprel_loss: 0.7852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.8981, batch_reg_loss: 0.1244, reg_loss: 0.1235 ||: 77%|#######6 | 85/111 [01:00<00:19, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9255, LAS: 0.8665, UEM: 0.5300, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5330, partial_loss/deprel_loss: 0.6727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.8982, batch_reg_loss: 0.1244, reg_loss: 0.1236 ||: 80%|######## | 89/111 [01:03<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9262, LAS: 0.8673, UEM: 0.5294, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4852, partial_loss/deprel_loss: 0.6245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.8921, batch_reg_loss: 0.1245, reg_loss: 0.1236 ||: 83%|########2 | 92/111 [01:05<00:13, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9261, LAS: 0.8670, UEM: 0.5272, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3968, partial_loss/deprel_loss: 0.5528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.8936, batch_reg_loss: 0.1246, reg_loss: 0.1236 ||: 86%|########6 | 96/111 [01:08<00:10, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9254, LAS: 0.8662, UEM: 0.5244, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.5442, partial_loss/deprel_loss: 0.9765, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2147, loss: 0.8996, batch_reg_loss: 0.1246, reg_loss: 0.1237 ||: 89%|########9 | 99/111 [01:10<00:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9260, LAS: 0.8668, UEM: 0.5231, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7287, partial_loss/deprel_loss: 0.8699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9663, loss: 0.8954, batch_reg_loss: 0.1247, reg_loss: 0.1237 ||: 93%|#########2| 103/111 [01:12<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9264, LAS: 0.8673, UEM: 0.5263, LEM: 0.2927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6999, loss: 0.8923, batch_reg_loss: 0.1248, reg_loss: 0.1237 ||: 95%|#########5| 106/111 [01:14<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9260, LAS: 0.8666, UEM: 0.5221, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2286, partial_loss/deprel_loss: 1.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3174, loss: 0.8969, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||: 99%|#########9| 110/111 [01:17<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9261, LAS: 0.8668, UEM: 0.5215, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8961, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||: 100%|##########| 
111/111 [01:17<00:00, 1.42it/s]\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.710 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.597 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - reg_loss | 0.124 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - UEM | 0.522 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LAS | 0.867 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - loss | 0.896 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEM | 0.289 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - 
combo.training.tensorboard_writer - UAS | 0.926 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EM | 0.884 | N/A\n", + "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Epoch duration: 0:01:17.923745\n", + "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Estimated training time remaining: 8:01:36\n", + "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Epoch 34/399\n", + "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:34:31,640 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:34:31,646 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9111, LAS: 0.8494, UEM: 0.1556, LEM: 0.0333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7581, partial_loss/deprel_loss: 0.8816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9818, loss: 1.0546, batch_reg_loss: 0.1249, reg_loss: 0.1249 ||: 3%|2 | 3/111 [00:02<01:13, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9056, LAS: 0.8439, UEM: 0.2538, LEM: 0.0790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 1.0748, batch_reg_loss: 0.1250, reg_loss: 0.1249 ||: 5%|5 | 6/111 [00:04<01:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.7825, UAS: 0.9077, LAS: 0.8464, UEM: 0.3817, LEM: 0.1861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7655, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5088, loss: 1.0438, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||: 8%|8 | 9/111 [00:06<01:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9136, LAS: 0.8528, UEM: 0.3986, LEM: 0.1842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6326, partial_loss/deprel_loss: 0.7305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0011, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||: 11%|# | 12/111 [00:08<01:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8578, UAS: 0.9196, LAS: 0.8600, UEM: 0.4359, LEM: 0.1994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 0.8639, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.9523, batch_reg_loss: 0.1252, reg_loss: 0.1250 ||: 14%|#4 | 16/111 [00:10<01:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9183, LAS: 0.8599, UEM: 0.4232, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4165, partial_loss/deprel_loss: 1.0787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2716, loss: 0.9521, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||: 18%|#8 | 20/111 [00:13<01:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9221, LAS: 0.8642, UEM: 0.4556, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 
0.9203, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||: 21%|## | 23/111 [00:15<01:01, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9262, LAS: 0.8687, UEM: 0.4854, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4130, partial_loss/deprel_loss: 0.5913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.8882, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9281, LAS: 0.8704, UEM: 0.4951, LEM: 0.2408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3141, partial_loss/deprel_loss: 0.4727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5664, loss: 0.8715, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||: 26%|##6 | 29/111 [00:20<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9292, LAS: 0.8718, UEM: 0.5290, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3000, partial_loss/deprel_loss: 0.4808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.8581, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||: 29%|##8 | 32/111 [00:22<00:59, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9294, LAS: 0.8719, UEM: 0.5231, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.5997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.8609, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||: 32%|###2 | 36/111 [00:25<00:53, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9275, LAS: 0.8696, UEM: 
0.5066, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9660, partial_loss/deprel_loss: 0.8184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9736, loss: 0.8780, batch_reg_loss: 0.1256, reg_loss: 0.1253 ||: 36%|###6 | 40/111 [00:27<00:48, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9269, LAS: 0.8686, UEM: 0.4966, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4479, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7006, loss: 0.8859, batch_reg_loss: 0.1257, reg_loss: 0.1253 ||: 40%|###9 | 44/111 [00:30<00:45, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9260, LAS: 0.8677, UEM: 0.4901, LEM: 0.2465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8959, batch_reg_loss: 0.1258, reg_loss: 0.1253 ||: 42%|####2 | 47/111 [00:32<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9266, LAS: 0.8686, UEM: 0.4965, LEM: 0.2503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2710, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.8885, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||: 46%|####5 | 51/111 [00:35<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9264, LAS: 0.8687, UEM: 0.5060, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0437, partial_loss/deprel_loss: 0.9126, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.8867, batch_reg_loss: 0.1259, 
reg_loss: 0.1254 ||: 49%|####8 | 54/111 [00:37<00:39, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9265, LAS: 0.8685, UEM: 0.4986, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4914, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.8885, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9267, LAS: 0.8690, UEM: 0.5166, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8846, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||: 54%|#####4 | 60/111 [00:41<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9268, LAS: 0.8693, UEM: 0.5151, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.8828, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||: 57%|#####6 | 63/111 [00:44<00:35, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9262, LAS: 0.8687, UEM: 0.5069, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5799, partial_loss/deprel_loss: 0.7299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8261, loss: 0.8887, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||: 59%|#####9 | 66/111 [00:46<00:32, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8858, UAS: 0.9267, LAS: 0.8691, UEM: 0.5082, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 0.6044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.8859, batch_reg_loss: 0.1262, reg_loss: 0.1256 ||: 62%|######2 | 69/111 [00:48<00:31, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.9255, LAS: 0.8676, UEM: 0.4995, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6270, partial_loss/deprel_loss: 1.1887, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4026, loss: 0.8979, batch_reg_loss: 0.1263, reg_loss: 0.1256 ||: 65%|######4 | 72/111 [00:50<00:29, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9261, LAS: 0.8686, UEM: 0.5204, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.8069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8909, batch_reg_loss: 0.1264, reg_loss: 0.1256 ||: 68%|######7 | 75/111 [00:53<00:27, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9257, LAS: 0.8678, UEM: 0.5206, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2415, partial_loss/deprel_loss: 1.1330, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2811, loss: 0.8966, batch_reg_loss: 0.1264, reg_loss: 0.1257 ||: 71%|#######1 | 79/111 [00:55<00:23, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9256, LAS: 0.8678, UEM: 0.5151, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6984, partial_loss/deprel_loss: 0.7058, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.8308, loss: 0.8966, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||: 74%|#######3 | 82/111 [00:58<00:21, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.9253, LAS: 0.8674, UEM: 0.5110, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1613, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.9004, batch_reg_loss: 0.1266, reg_loss: 0.1257 ||: 77%|#######6 | 85/111 [01:00<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9256, LAS: 0.8676, UEM: 0.5044, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7210, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9277, loss: 0.8993, batch_reg_loss: 0.1266, reg_loss: 0.1258 ||: 80%|######## | 89/111 [01:02<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9267, LAS: 0.8690, UEM: 0.5185, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.8883, batch_reg_loss: 0.1267, reg_loss: 0.1258 ||: 84%|########3 | 93/111 [01:05<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9271, LAS: 0.8695, UEM: 0.5184, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.7246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8667, loss: 0.8846, batch_reg_loss: 0.1268, reg_loss: 0.1258 ||: 87%|########7 | 97/111 [01:07<00:09, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8105, UAS: 0.9253, LAS: 0.8672, UEM: 0.5146, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3796, partial_loss/deprel_loss: 1.2244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3823, loss: 0.9042, batch_reg_loss: 0.1269, reg_loss: 0.1259 ||: 91%|######### | 101/111 [01:10<00:06, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9253, LAS: 0.8672, UEM: 0.5136, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4786, partial_loss/deprel_loss: 0.7123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7925, loss: 0.9034, batch_reg_loss: 0.1270, reg_loss: 0.1259 ||: 95%|#########4| 105/111 [01:12<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9259, LAS: 0.8680, UEM: 0.5158, LEM: 0.2860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5921, loss: 0.8959, batch_reg_loss: 0.1270, reg_loss: 0.1260 ||: 98%|#########8| 109/111 [01:15<00:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9261, LAS: 0.8681, UEM: 0.5174, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8394, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9796, loss: 0.8944, batch_reg_loss: 0.1271, reg_loss: 0.1260 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 
N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.856 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.839 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - reg_loss | 0.126 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UEM | 0.517 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LAS | 0.868 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - loss | 0.894 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEM | 0.286 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UAS | 0.926 | N/A\n", + "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:35:48,411 - INFO - combo.training.tensorboard_writer - EM | 0.853 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 
23:35:48,411 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Epoch duration: 0:01:16.772068\n", + "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Estimated training time remaining: 7:59:54\n", + "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Epoch 35/399\n", + "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:35:48,412 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:35:48,418 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.9216, LAS: 0.8633, UEM: 0.5277, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1609, partial_loss/deprel_loss: 0.9063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8635, batch_reg_loss: 0.1272, reg_loss: 0.1271 ||: 4%|3 | 4/111 [00:02<01:10, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9235, LAS: 0.8655, UEM: 0.4402, LEM: 0.2191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5437, partial_loss/deprel_loss: 0.6562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7609, loss: 0.8720, batch_reg_loss: 0.1272, reg_loss: 0.1272 ||: 6%|6 | 7/111 [00:04<01:09, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9283, LAS: 0.8721, UEM: 0.5337, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.8287, batch_reg_loss: 0.1273, reg_loss: 0.1272 ||: 10%|9 | 11/111 [00:07<01:04, 1.55it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9337, LAS: 0.8795, UEM: 0.6324, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8339, partial_loss/deprel_loss: 0.8628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9844, loss: 0.7854, batch_reg_loss: 0.1274, reg_loss: 0.1272 ||: 13%|#2 | 14/111 [00:09<01:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9359, LAS: 0.8817, UEM: 0.6234, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7271, loss: 0.7716, batch_reg_loss: 0.1274, reg_loss: 0.1273 ||: 15%|#5 | 17/111 [00:11<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9321, LAS: 0.8770, UEM: 0.5887, LEM: 0.3752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0131, loss: 0.8049, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||: 18%|#8 | 20/111 [00:13<01:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9340, LAS: 0.8787, UEM: 0.5950, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3717, partial_loss/deprel_loss: 0.6203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7990, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||: 21%|## | 23/111 [00:15<01:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9337, LAS: 0.8779, UEM: 0.5850, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.2579, partial_loss/deprel_loss: 0.9992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1785, loss: 0.8028, batch_reg_loss: 0.1276, reg_loss: 0.1273 ||: 24%|##4 | 27/111 [00:17<00:55, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9350, LAS: 0.8794, UEM: 0.5883, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2687, partial_loss/deprel_loss: 0.4893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.7937, batch_reg_loss: 0.1276, reg_loss: 0.1274 ||: 27%|##7 | 30/111 [00:20<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9357, LAS: 0.8800, UEM: 0.5762, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6725, partial_loss/deprel_loss: 0.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8334, loss: 0.7902, batch_reg_loss: 0.1277, reg_loss: 0.1274 ||: 31%|### | 34/111 [00:22<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9370, LAS: 0.8816, UEM: 0.5877, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5669, partial_loss/deprel_loss: 0.7290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8244, loss: 0.7811, batch_reg_loss: 0.1278, reg_loss: 0.1274 ||: 33%|###3 | 37/111 [00:24<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9350, LAS: 0.8792, UEM: 0.5682, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2426, partial_loss/deprel_loss: 1.1232, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 0.8012, batch_reg_loss: 0.1278, reg_loss: 0.1275 ||: 37%|###6 | 41/111 [00:27<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7827, UAS: 0.9333, LAS: 0.8773, UEM: 0.5601, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1731, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6834, loss: 0.8193, batch_reg_loss: 0.1279, reg_loss: 0.1275 ||: 41%|#### | 45/111 [00:30<00:44, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.9327, LAS: 0.8767, UEM: 0.5487, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2953, partial_loss/deprel_loss: 0.9857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.8261, batch_reg_loss: 0.1280, reg_loss: 0.1275 ||: 44%|####4 | 49/111 [00:32<00:41, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9332, LAS: 0.8771, UEM: 0.5407, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6257, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9044, loss: 0.8255, batch_reg_loss: 0.1280, reg_loss: 0.1276 ||: 48%|####7 | 53/111 [00:35<00:37, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9305, LAS: 0.8738, UEM: 0.5267, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7496, partial_loss/deprel_loss: 0.8220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8506, batch_reg_loss: 0.1281, reg_loss: 0.1276 ||: 51%|#####1 | 57/111 [00:37<00:34, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9294, LAS: 0.8723, UEM: 0.5206, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, 
partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.8612, batch_reg_loss: 0.1282, reg_loss: 0.1276 ||: 55%|#####4 | 61/111 [00:40<00:32, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9286, LAS: 0.8712, UEM: 0.5098, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6110, partial_loss/deprel_loss: 0.7682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8651, loss: 0.8717, batch_reg_loss: 0.1283, reg_loss: 0.1277 ||: 59%|#####8 | 65/111 [00:43<00:30, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9255, LAS: 0.8680, UEM: 0.4994, LEM: 0.2757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8341, partial_loss/deprel_loss: 0.8179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.8981, batch_reg_loss: 0.1284, reg_loss: 0.1277 ||: 62%|######2 | 69/111 [00:45<00:28, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9260, LAS: 0.8685, UEM: 0.5123, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7949, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9098, loss: 0.8941, batch_reg_loss: 0.1284, reg_loss: 0.1278 ||: 65%|######4 | 72/111 [00:47<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7804, UAS: 0.9254, LAS: 0.8680, UEM: 0.5102, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1089, partial_loss/deprel_loss: 1.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5832, loss: 0.8992, batch_reg_loss: 0.1285, reg_loss: 0.1278 ||: 
68%|######7 | 75/111 [00:50<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9269, LAS: 0.8696, UEM: 0.5202, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2120, partial_loss/deprel_loss: 0.3991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.8862, batch_reg_loss: 0.1286, reg_loss: 0.1278 ||: 71%|#######1 | 79/111 [00:52<00:22, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9274, LAS: 0.8700, UEM: 0.5204, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3154, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.8838, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||: 74%|#######3 | 82/111 [00:55<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9281, LAS: 0.8709, UEM: 0.5253, LEM: 0.2929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.8759, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||: 77%|#######6 | 85/111 [00:57<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8220, UAS: 0.9270, LAS: 0.8697, UEM: 0.5177, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3218, partial_loss/deprel_loss: 1.0454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2295, loss: 0.8849, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||: 79%|#######9 | 88/111 [00:59<00:17, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9260, LAS: 0.8684, UEM: 0.5104, LEM: 0.2823, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4441, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4223, loss: 0.8980, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||: 83%|########2 | 92/111 [01:02<00:13, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9262, LAS: 0.8686, UEM: 0.5193, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3134, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8958, batch_reg_loss: 0.1289, reg_loss: 0.1280 ||: 86%|########5 | 95/111 [01:04<00:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9256, LAS: 0.8679, UEM: 0.5131, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 0.8091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9497, loss: 0.9019, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||: 88%|########8 | 98/111 [01:06<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9268, LAS: 0.8692, UEM: 0.5273, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3296, partial_loss/deprel_loss: 0.4673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.8912, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||: 91%|######### | 101/111 [01:08<00:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8077, UAS: 0.9265, LAS: 0.8689, UEM: 0.5272, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5767, partial_loss/deprel_loss: 1.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4546, loss: 0.8940, batch_reg_loss: 0.1291, 
reg_loss: 0.1281 ||: 94%|#########3| 104/111 [01:11<00:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9270, LAS: 0.8692, UEM: 0.5252, LEM: 0.2916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9199, partial_loss/deprel_loss: 0.9289, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0563, loss: 0.8924, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||: 97%|#########7| 108/111 [01:13<00:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9271, LAS: 0.8694, UEM: 0.5212, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5733, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.8907, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:37:04,098 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9346, LAS: 0.8832, UEM: 0.6393, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6542, partial_loss/deprel_loss: 60.5480, partial_loss/cycle_loss: 0.0000, batch_loss: 48.7692, loss: 28.2319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:03<00:10, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9413, LAS: 0.8902, UEM: 0.6892, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 30.7479, partial_loss/cycle_loss: 0.0000, batch_loss: 24.7503, loss: 26.1370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:07, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9440, LAS: 0.8904, UEM: 0.6567, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 24.9592, partial_loss/cycle_loss: 0.0000, batch_loss: 20.0503, loss: 25.0336, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9429, LAS: 0.8893, UEM: 0.6474, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0086, partial_loss/deprel_loss: 44.8982, partial_loss/cycle_loss: 0.0000, batch_loss: 36.1203, loss: 26.7810, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9419, LAS: 0.8881, UEM: 0.6314, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 31.8272, partial_loss/cycle_loss: 0.0000, batch_loss: 25.6312, loss: 26.6926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.05it/s]\n", + "2023-04-06 23:37:16,466 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - 
patience | 6.000 | N/A\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.638 | 31.827\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.573 | 0.847\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - reg_loss | 0.128 | 0.000\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UEM | 0.521 | 0.631\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - LAS | 0.869 | 0.888\n", + "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - loss | 0.891 | 26.693\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEM | 0.288 | 0.366\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - UAS | 0.927 | 0.942\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EM | 0.877 | 0.874\n", + "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Epoch duration: 0:01:28.057300\n", + "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Estimated training time remaining: 8:00:08\n", + "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - Epoch 36/399\n", + "2023-04-06 23:37:16,469 - INFO - 
allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-06 23:37:16,477 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9452, LAS: 0.8924, UEM: 0.5289, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.6698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7053, batch_reg_loss: 0.1293, reg_loss: 0.1293 ||: 3%|2 | 3/111 [00:02<01:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7919, UAS: 0.9146, LAS: 0.8533, UEM: 0.4009, LEM: 0.1795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6848, partial_loss/deprel_loss: 1.3093, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5138, loss: 1.0154, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||: 6%|6 | 7/111 [00:04<01:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9211, LAS: 0.8604, UEM: 0.4206, LEM: 0.1742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.6605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7498, loss: 0.9638, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||: 9%|9 | 10/111 [00:06<01:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9129, LAS: 0.8526, UEM: 0.3770, LEM: 0.1513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8000, partial_loss/deprel_loss: 0.7861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9183, loss: 1.0215, 
batch_reg_loss: 0.1295, reg_loss: 0.1294 ||: 12%|#1 | 13/111 [00:08<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9189, LAS: 0.8602, UEM: 0.3997, LEM: 0.1637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4654, partial_loss/deprel_loss: 0.6501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7427, loss: 0.9621, batch_reg_loss: 0.1295, reg_loss: 0.1294 ||: 14%|#4 | 16/111 [00:11<01:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8315, UAS: 0.9139, LAS: 0.8544, UEM: 0.3725, LEM: 0.1497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0556, partial_loss/deprel_loss: 1.0156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1532, loss: 1.0103, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||: 17%|#7 | 19/111 [00:13<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9164, LAS: 0.8573, UEM: 0.4090, LEM: 0.1805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.9840, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||: 20%|#9 | 22/111 [00:15<01:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9206, LAS: 0.8620, UEM: 0.5124, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0660, partial_loss/deprel_loss: 0.1975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3009, loss: 0.9505, batch_reg_loss: 0.1297, reg_loss: 0.1295 ||: 23%|##2 | 25/111 [00:17<01:05, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8453, UAS: 0.9192, LAS: 0.8603, UEM: 0.4831, LEM: 
0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0821, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0308, loss: 0.9618, batch_reg_loss: 0.1298, reg_loss: 0.1295 ||: 26%|##6 | 29/111 [00:20<00:58, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9221, LAS: 0.8634, UEM: 0.5052, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1437, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4772, loss: 0.9353, batch_reg_loss: 0.1299, reg_loss: 0.1295 ||: 29%|##8 | 32/111 [00:22<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9198, LAS: 0.8611, UEM: 0.4829, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1443, partial_loss/deprel_loss: 0.8956, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0753, loss: 0.9539, batch_reg_loss: 0.1299, reg_loss: 0.1296 ||: 32%|###2 | 36/111 [00:25<00:52, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9206, LAS: 0.8620, UEM: 0.4807, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.6688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.9482, batch_reg_loss: 0.1300, reg_loss: 0.1296 ||: 35%|###5 | 39/111 [00:27<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9212, LAS: 0.8630, UEM: 0.4812, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1409, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1650, loss: 0.9400, batch_reg_loss: 0.1301, reg_loss: 0.1297 
||: 39%|###8 | 43/111 [00:29<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9227, LAS: 0.8648, UEM: 0.4976, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2244, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.9244, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||: 42%|####2 | 47/111 [00:32<00:42, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9247, LAS: 0.8669, UEM: 0.5112, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.9069, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||: 45%|####5 | 50/111 [00:34<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9256, LAS: 0.8678, UEM: 0.5218, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9718, partial_loss/deprel_loss: 0.9520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8975, batch_reg_loss: 0.1303, reg_loss: 0.1298 ||: 48%|####7 | 53/111 [00:36<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9273, LAS: 0.8700, UEM: 0.5428, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5033, partial_loss/deprel_loss: 0.6351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8805, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9283, LAS: 0.8711, UEM: 0.5485, LEM: 0.3151, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4286, partial_loss/deprel_loss: 0.5783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8710, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9295, LAS: 0.8725, UEM: 0.5627, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.8593, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||: 57%|#####6 | 63/111 [00:43<00:34, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9297, LAS: 0.8727, UEM: 0.5516, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5741, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8456, loss: 0.8591, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||: 60%|###### | 67/111 [00:46<00:30, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9298, LAS: 0.8726, UEM: 0.5457, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1037, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1326, loss: 0.8598, batch_reg_loss: 0.1306, reg_loss: 0.1299 ||: 64%|######3 | 71/111 [00:48<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9304, LAS: 0.8730, UEM: 0.5460, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3699, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, 
loss: 0.8557, batch_reg_loss: 0.1306, reg_loss: 0.1300 ||: 68%|######7 | 75/111 [00:51<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9292, LAS: 0.8716, UEM: 0.5398, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4855, partial_loss/deprel_loss: 1.0485, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2665, loss: 0.8661, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9298, LAS: 0.8723, UEM: 0.5468, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4292, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.8599, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||: 75%|#######4 | 83/111 [00:57<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9290, LAS: 0.8713, UEM: 0.5385, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5060, partial_loss/deprel_loss: 0.6993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7915, loss: 0.8692, batch_reg_loss: 0.1308, reg_loss: 0.1301 ||: 78%|#######8 | 87/111 [00:59<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9280, LAS: 0.8700, UEM: 0.5342, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7672, partial_loss/deprel_loss: 0.9964, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0814, loss: 0.8801, batch_reg_loss: 0.1309, reg_loss: 0.1301 ||: 82%|########1 | 91/111 [01:01<00:12, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, 
UAS: 0.9272, LAS: 0.8690, UEM: 0.5320, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2635, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.8877, batch_reg_loss: 0.1310, reg_loss: 0.1301 ||: 86%|########5 | 95/111 [01:04<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9272, LAS: 0.8689, UEM: 0.5316, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6200, loss: 0.8883, batch_reg_loss: 0.1310, reg_loss: 0.1302 ||: 88%|########8 | 98/111 [01:07<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9277, LAS: 0.8693, UEM: 0.5311, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6978, loss: 0.8848, batch_reg_loss: 0.1311, reg_loss: 0.1302 ||: 92%|#########1| 102/111 [01:09<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9277, LAS: 0.8695, UEM: 0.5285, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4234, partial_loss/deprel_loss: 0.5900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.8845, batch_reg_loss: 0.1312, reg_loss: 0.1302 ||: 95%|#########5| 106/111 [01:12<00:03, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9270, LAS: 0.8688, UEM: 0.5260, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5303, loss: 0.8900, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||: 99%|#########9| 110/111 [01:15<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9271, LAS: 0.8689, UEM: 0.5252, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5826, partial_loss/deprel_loss: 0.7173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8217, loss: 0.8894, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.717 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.583 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - reg_loss | 0.130 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - UEM | 0.525 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LAS | 0.869 | N/A\n", + 
"2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - loss | 0.889 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LEM | 0.287 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - UAS | 0.927 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EM | 0.874 | N/A\n", + "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Epoch duration: 0:01:15.709732\n", + "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Estimated training time remaining: 7:58:15\n", + "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Epoch 37/399\n", + "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:38:32,188 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9332, LAS: 0.8765, UEM: 0.4678, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3651, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5898, loss: 0.8393, batch_reg_loss: 0.1314, reg_loss: 0.1314 ||: 4%|3 | 4/111 [00:02<01:08, 1.56it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9418, LAS: 0.8880, UEM: 0.6776, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5287, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7562, loss: 0.7479, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||: 6%|6 | 7/111 [00:05<01:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9401, LAS: 0.8861, UEM: 0.6351, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7604, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||: 9%|9 | 10/111 [00:07<01:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9390, LAS: 0.8841, UEM: 0.5888, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3963, partial_loss/deprel_loss: 0.5860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.7824, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||: 13%|#2 | 14/111 [00:09<01:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8355, UAS: 0.9365, LAS: 0.8814, UEM: 0.5696, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2521, partial_loss/deprel_loss: 0.9936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1770, loss: 0.8040, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||: 15%|#5 | 17/111 [00:11<01:03, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9375, LAS: 0.8818, UEM: 0.5544, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, 
partial_loss/deprel_loss: 0.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8096, loss: 0.7999, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||: 18%|#8 | 20/111 [00:13<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9373, LAS: 0.8809, UEM: 0.5360, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 0.7038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.8015, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||: 21%|## | 23/111 [00:15<00:59, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9358, LAS: 0.8789, UEM: 0.5296, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3506, partial_loss/deprel_loss: 0.5437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 0.8139, batch_reg_loss: 0.1318, reg_loss: 0.1316 ||: 24%|##4 | 27/111 [00:18<00:56, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9368, LAS: 0.8799, UEM: 0.5409, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.8028, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||: 28%|##7 | 31/111 [00:20<00:52, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9310, LAS: 0.8739, UEM: 0.5321, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7992, partial_loss/deprel_loss: 1.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4886, loss: 0.8534, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||: 31%|### | 34/111 [00:23<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9295, LAS: 0.8724, UEM: 0.5293, LEM: 0.2876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.6494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.8636, batch_reg_loss: 0.1320, reg_loss: 0.1317 ||: 34%|###4 | 38/111 [00:25<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9291, LAS: 0.8717, UEM: 0.5239, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7996, partial_loss/deprel_loss: 0.7570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.8671, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||: 37%|###6 | 41/111 [00:27<00:48, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9284, LAS: 0.8710, UEM: 0.5212, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8072, partial_loss/deprel_loss: 0.7757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.8724, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||: 40%|###9 | 44/111 [00:30<00:47, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9267, LAS: 0.8691, UEM: 0.5128, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.5814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6685, loss: 0.8894, batch_reg_loss: 0.1322, reg_loss: 0.1318 ||: 42%|####2 | 47/111 [00:32<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9279, LAS: 0.8706, UEM: 0.5283, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2007, partial_loss/deprel_loss: 0.3160, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.8751, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||: 46%|####5 | 51/111 [00:35<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9263, LAS: 0.8688, UEM: 0.5287, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.8898, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||: 49%|####8 | 54/111 [00:37<00:41, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9249, LAS: 0.8676, UEM: 0.5162, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4259, partial_loss/deprel_loss: 0.9915, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2108, loss: 0.8998, batch_reg_loss: 0.1324, reg_loss: 0.1319 ||: 51%|#####1 | 57/111 [00:39<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9245, LAS: 0.8671, UEM: 0.5301, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1480, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3828, loss: 0.9042, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||: 54%|#####4 | 60/111 [00:41<00:36, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9240, LAS: 0.8665, UEM: 0.5210, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8904, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9674, loss: 0.9083, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||: 57%|#####6 | 63/111 [00:43<00:34, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": 
[ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9239, LAS: 0.8662, UEM: 0.5185, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3084, partial_loss/deprel_loss: 0.5285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6171, loss: 0.9107, batch_reg_loss: 0.1326, reg_loss: 0.1319 ||: 59%|#####9 | 66/111 [00:45<00:31, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9242, LAS: 0.8665, UEM: 0.5151, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3071, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5583, loss: 0.9102, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||: 63%|######3 | 70/111 [00:48<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9240, LAS: 0.8662, UEM: 0.5102, LEM: 0.2864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4604, partial_loss/deprel_loss: 1.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3878, loss: 0.9143, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||: 67%|######6 | 74/111 [00:50<00:24, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9252, LAS: 0.8674, UEM: 0.5201, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.6707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.9017, batch_reg_loss: 0.1328, reg_loss: 0.1321 ||: 70%|####### | 78/111 [00:53<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9250, LAS: 0.8668, UEM: 0.5147, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4345, partial_loss/deprel_loss: 0.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7721, loss: 0.9045, batch_reg_loss: 0.1329, reg_loss: 0.1321 ||: 74%|#######3 | 82/111 [00:55<00:18, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9257, LAS: 0.8676, UEM: 0.5136, LEM: 0.2802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7814, partial_loss/deprel_loss: 0.6975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8472, loss: 0.8976, batch_reg_loss: 0.1330, reg_loss: 0.1321 ||: 77%|#######7 | 86/111 [00:58<00:16, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9262, LAS: 0.8681, UEM: 0.5186, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9150, partial_loss/deprel_loss: 0.9404, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0683, loss: 0.8935, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||: 81%|########1 | 90/111 [01:00<00:13, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8307, UAS: 0.9267, LAS: 0.8686, UEM: 0.5241, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1581, partial_loss/deprel_loss: 0.9771, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8894, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||: 85%|########4 | 94/111 [01:03<00:10, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9258, LAS: 0.8677, UEM: 0.5219, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0681, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1631, loss: 0.8979, batch_reg_loss: 0.1332, reg_loss: 0.1323 ||: 88%|########8 | 98/111 [01:06<00:08, 
1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9266, LAS: 0.8686, UEM: 0.5311, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3334, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.8899, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||: 92%|#########1| 102/111 [01:09<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9265, LAS: 0.8684, UEM: 0.5272, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7599, loss: 0.8925, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||: 95%|#########4| 105/111 [01:11<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9261, LAS: 0.8679, UEM: 0.5228, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5106, partial_loss/deprel_loss: 0.6320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7411, loss: 0.8953, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 97%|#########7| 108/111 [01:13<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.650 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.545 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - reg_loss | 0.132 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UEM | 0.522 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LAS | 0.868 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - loss | 0.891 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LEM | 0.286 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UAS | 0.926 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EM | 0.894 | N/A\n", + "2023-04-06 23:39:48,044 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:39:48,044 - INFO - combo.training.trainer - Epoch duration: 0:01:15.865530\n", + "2023-04-06 23:39:48,045 - INFO - combo.training.trainer - Estimated training time remaining: 7:56:25\n", + "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Epoch 38/399\n", + "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:39:48,052 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9161, LAS: 0.8534, UEM: 0.1467, LEM: 0.0433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0036, partial_loss/deprel_loss: 0.8636, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9915, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||: 3%|2 | 3/111 [00:02<01:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8142, UAS: 0.9123, LAS: 0.8513, UEM: 0.1802, LEM: 0.0496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5122, partial_loss/deprel_loss: 1.1313, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3410, loss: 
1.0190, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||: 5%|5 | 6/111 [00:04<01:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9073, LAS: 0.8475, UEM: 0.2964, LEM: 0.1575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3239, partial_loss/deprel_loss: 0.4766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 1.0513, batch_reg_loss: 0.1336, reg_loss: 0.1335 ||: 9%|9 | 10/111 [00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9198, LAS: 0.8619, UEM: 0.4844, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5275, partial_loss/deprel_loss: 0.6271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.9421, batch_reg_loss: 0.1337, reg_loss: 0.1336 ||: 13%|#2 | 14/111 [00:09<01:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9218, LAS: 0.8642, UEM: 0.4745, LEM: 0.2762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3876, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6086, loss: 0.9359, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||: 15%|#5 | 17/111 [00:11<01:02, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9248, LAS: 0.8685, UEM: 0.4811, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4559, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.9002, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||: 19%|#8 | 21/111 [00:13<00:59, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9240, LAS: 0.8676, UEM: 0.4905, 
LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.6274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7447, loss: 0.9093, batch_reg_loss: 0.1339, reg_loss: 0.1337 ||: 22%|##1 | 24/111 [00:16<01:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9241, LAS: 0.8673, UEM: 0.4942, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9047, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||: 24%|##4 | 27/111 [00:18<00:59, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9236, LAS: 0.8662, UEM: 0.4872, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3372, partial_loss/deprel_loss: 0.5897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6733, loss: 0.9112, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||: 27%|##7 | 30/111 [00:20<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9250, LAS: 0.8682, UEM: 0.5068, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5721, loss: 0.8960, batch_reg_loss: 0.1341, reg_loss: 0.1338 ||: 30%|##9 | 33/111 [00:22<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7594, UAS: 0.9238, LAS: 0.8673, UEM: 0.5198, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6236, partial_loss/deprel_loss: 1.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9675, loss: 0.9092, batch_reg_loss: 0.1341, reg_loss: 
0.1338 ||: 32%|###2 | 36/111 [00:25<00:56, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9248, LAS: 0.8688, UEM: 0.5415, LEM: 0.3280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0372, partial_loss/deprel_loss: 0.9183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8961, batch_reg_loss: 0.1342, reg_loss: 0.1338 ||: 35%|###5 | 39/111 [00:27<00:53, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9254, LAS: 0.8697, UEM: 0.5361, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3875, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.8888, batch_reg_loss: 0.1343, reg_loss: 0.1338 ||: 38%|###7 | 42/111 [00:29<00:51, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9276, LAS: 0.8721, UEM: 0.5593, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1639, partial_loss/deprel_loss: 0.4386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5180, loss: 0.8677, batch_reg_loss: 0.1343, reg_loss: 0.1339 ||: 41%|####1 | 46/111 [00:32<00:46, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9286, LAS: 0.8729, UEM: 0.5516, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4020, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6780, loss: 0.8602, batch_reg_loss: 0.1344, reg_loss: 0.1339 ||: 45%|####5 | 50/111 [00:34<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8677, UAS: 0.9283, LAS: 0.8724, UEM: 0.5407, LEM: 0.3145, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7025, partial_loss/deprel_loss: 0.8024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9169, loss: 0.8647, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||: 48%|####7 | 53/111 [00:37<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9300, LAS: 0.8742, UEM: 0.5445, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3832, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.8520, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||: 51%|#####1 | 57/111 [00:39<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9292, LAS: 0.8732, UEM: 0.5361, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0990, partial_loss/deprel_loss: 0.9602, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1226, loss: 0.8597, batch_reg_loss: 0.1346, reg_loss: 0.1340 ||: 55%|#####4 | 61/111 [00:42<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8736, UEM: 0.5367, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4994, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6924, loss: 0.8544, batch_reg_loss: 0.1346, reg_loss: 0.1341 ||: 58%|#####7 | 64/111 [00:44<00:33, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9282, LAS: 0.8718, UEM: 0.5287, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7784, partial_loss/deprel_loss: 1.2841, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.5176, loss: 0.8678, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||: 60%|###### | 67/111 [00:46<00:30, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9276, LAS: 0.8711, UEM: 0.5219, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9674, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0079, loss: 0.8726, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||: 63%|######3 | 70/111 [00:48<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9280, LAS: 0.8714, UEM: 0.5153, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7153, loss: 0.8731, batch_reg_loss: 0.1348, reg_loss: 0.1341 ||: 67%|######6 | 74/111 [00:51<00:24, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8183, UAS: 0.9288, LAS: 0.8724, UEM: 0.5400, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4612, partial_loss/deprel_loss: 1.1146, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3188, loss: 0.8662, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||: 70%|####### | 78/111 [00:54<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9283, LAS: 0.8717, UEM: 0.5372, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6727, loss: 0.8713, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||: 73%|#######2 | 81/111 [00:56<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8786, UAS: 0.9280, LAS: 0.8713, UEM: 0.5341, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5286, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8738, batch_reg_loss: 0.1350, reg_loss: 0.1342 ||: 76%|#######5 | 84/111 [00:58<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9284, LAS: 0.8716, UEM: 0.5292, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6210, partial_loss/deprel_loss: 0.6848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.8722, batch_reg_loss: 0.1351, reg_loss: 0.1343 ||: 79%|#######9 | 88/111 [01:01<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9283, LAS: 0.8715, UEM: 0.5263, LEM: 0.3003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2265, partial_loss/deprel_loss: 0.9465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1377, loss: 0.8723, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||: 83%|########2 | 92/111 [01:03<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9284, LAS: 0.8716, UEM: 0.5317, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3219, partial_loss/deprel_loss: 0.5873, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6694, loss: 0.8716, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||: 86%|########6 | 96/111 [01:06<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7974, UAS: 0.9280, LAS: 0.8711, UEM: 0.5262, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.2148, partial_loss/cycle_loss: 0.0000, 
batch_loss: 1.4368, loss: 0.8753, batch_reg_loss: 0.1353, reg_loss: 0.1344 ||: 90%|######### | 100/111 [01:09<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9261, LAS: 0.8692, UEM: 0.5205, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4797, partial_loss/deprel_loss: 1.0433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8891, batch_reg_loss: 0.1354, reg_loss: 0.1344 ||: 93%|#########2| 103/111 [01:11<00:05, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9259, LAS: 0.8689, UEM: 0.5149, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9886, partial_loss/deprel_loss: 0.9805, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1176, loss: 0.8923, batch_reg_loss: 0.1354, reg_loss: 0.1345 ||: 96%|#########6| 107/111 [01:14<00:02, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - 
Training | Validation\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.493 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.261 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - reg_loss | 0.134 | N/A\n", + "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UEM | 0.516 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LAS | 0.870 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - loss | 0.888 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEM | 0.291 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - UAS | 0.926 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - 
FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EM | 0.911 | N/A\n", + "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Epoch duration: 0:01:16.437091\n", + "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Estimated training time remaining: 7:54:43\n", + "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Epoch 39/399\n", + "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:41:04,489 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9271, LAS: 0.8726, UEM: 0.3130, LEM: 0.1275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7463, partial_loss/deprel_loss: 0.7432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.8727, batch_reg_loss: 0.1356, reg_loss: 0.1356 ||: 3%|2 | 3/111 [00:02<01:26, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9318, LAS: 0.8801, UEM: 0.6530, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.7412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8926, loss: 0.8137, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||: 5%|5 | 6/111 [00:04<01:23, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9279, LAS: 0.8751, UEM: 0.6365, LEM: 0.4647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4726, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.8520, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||: 8%|8 | 9/111 [00:07<01:20, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9365, LAS: 0.8843, UEM: 0.6833, LEM: 0.4764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1591, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.7746, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||: 11%|# | 12/111 [00:09<01:17, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9311, LAS: 0.8782, UEM: 0.6278, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4972, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6593, loss: 0.8231, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||: 14%|#4 | 16/111 [00:11<01:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9309, LAS: 0.8773, UEM: 0.5934, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9963, loss: 0.8333, batch_reg_loss: 0.1359, reg_loss: 0.1357 ||: 17%|#7 | 19/111 [00:14<01:07, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9315, LAS: 0.8780, UEM: 0.6091, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3746, loss: 0.8262, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||: 20%|#9 | 22/111 [00:16<01:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9291, LAS: 0.8751, UEM: 0.5884, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4094, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.8458, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||: 23%|##2 | 25/111 [00:18<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9310, LAS: 0.8771, UEM: 0.5775, LEM: 0.3731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4881, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7661, loss: 0.8331, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||: 25%|##5 | 28/111 [00:20<00:59, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9315, LAS: 0.8775, UEM: 0.5766, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.8266, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||: 28%|##7 | 31/111 [00:23<01:02, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9334, LAS: 0.8794, UEM: 0.5744, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4142, partial_loss/deprel_loss: 0.5945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.8153, batch_reg_loss: 0.1362, reg_loss: 0.1359 ||: 32%|###1 | 35/111 [00:25<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9338, LAS: 0.8798, UEM: 0.5824, LEM: 0.3585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, 
partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.8117, batch_reg_loss: 0.1363, reg_loss: 0.1359 ||: 35%|###5 | 39/111 [00:28<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9350, LAS: 0.8810, UEM: 0.5892, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.5966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.8028, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||: 39%|###8 | 43/111 [00:30<00:45, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9368, LAS: 0.8829, UEM: 0.5965, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5324, loss: 0.7887, batch_reg_loss: 0.1364, reg_loss: 0.1360 ||: 42%|####2 | 47/111 [00:32<00:40, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8263, UAS: 0.9351, LAS: 0.8808, UEM: 0.5802, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2804, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2017, loss: 0.8047, batch_reg_loss: 0.1365, reg_loss: 0.1360 ||: 46%|####5 | 51/111 [00:35<00:38, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.9341, LAS: 0.8795, UEM: 0.5765, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8381, partial_loss/deprel_loss: 1.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4981, loss: 0.8138, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||: 50%|####9 | 55/111 [00:38<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9343, LAS: 0.8798, UEM: 0.5758, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.8124, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||: 52%|#####2 | 58/111 [00:40<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9338, LAS: 0.8791, UEM: 0.5644, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5629, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7725, loss: 0.8162, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||: 56%|#####5 | 62/111 [00:42<00:31, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9340, LAS: 0.8790, UEM: 0.5651, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0235, partial_loss/deprel_loss: 0.9341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0887, loss: 0.8163, batch_reg_loss: 0.1367, reg_loss: 0.1362 ||: 59%|#####9 | 66/111 [00:45<00:28, 1.61it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9333, LAS: 0.8778, UEM: 0.5585, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8708, partial_loss/deprel_loss: 1.0278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1332, loss: 0.8263, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||: 63%|######3 | 70/111 [00:48<00:26, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9324, LAS: 0.8769, UEM: 0.5601, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6606, loss: 0.8319, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||: 67%|######6 | 74/111 [00:50<00:23, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9312, LAS: 0.8757, UEM: 0.5582, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3023, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.8426, batch_reg_loss: 0.1369, reg_loss: 0.1363 ||: 70%|####### | 78/111 [00:53<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9305, LAS: 0.8749, UEM: 0.5510, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3944, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8499, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||: 74%|#######3 | 82/111 [00:56<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9310, LAS: 0.8753, UEM: 0.5488, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3884, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.8477, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||: 77%|#######6 | 85/111 [00:58<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9303, LAS: 0.8745, UEM: 0.5408, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9831, partial_loss/deprel_loss: 0.8483, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0123, loss: 0.8528, batch_reg_loss: 0.1371, reg_loss: 0.1363 ||: 79%|#######9 | 88/111 
[01:00<00:15, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9297, LAS: 0.8737, UEM: 0.5392, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4849, partial_loss/deprel_loss: 0.6716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7715, loss: 0.8581, batch_reg_loss: 0.1372, reg_loss: 0.1364 ||: 83%|########2 | 92/111 [01:02<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9299, LAS: 0.8737, UEM: 0.5393, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0448, partial_loss/deprel_loss: 0.8961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0631, loss: 0.8567, batch_reg_loss: 0.1373, reg_loss: 0.1364 ||: 86%|########6 | 96/111 [01:05<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9285, LAS: 0.8721, UEM: 0.5326, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6162, partial_loss/deprel_loss: 1.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4737, loss: 0.8717, batch_reg_loss: 0.1374, reg_loss: 0.1364 ||: 90%|######### | 100/111 [01:08<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9289, LAS: 0.8726, UEM: 0.5333, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8157, loss: 0.8672, batch_reg_loss: 0.1374, reg_loss: 0.1365 ||: 93%|#########2| 103/111 [01:10<00:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8184, UAS: 0.9280, LAS: 0.8714, UEM: 0.5288, LEM: 0.2982, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3722, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3191, loss: 0.8774, batch_reg_loss: 0.1375, reg_loss: 0.1365 ||: 96%|#########6| 107/111 [01:13<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - 
combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.551 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.591 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - reg_loss | 0.137 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UEM | 0.526 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LAS | 0.871 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - loss | 0.879 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEM | 0.296 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UAS | 0.928 | N/A\n", + "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - EM | 0.889 | N/A\n", + "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Epoch duration: 0:01:15.902319\n", + "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Estimated training time remaining: 7:52:57\n", + "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Epoch 40/399\n", + "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:42:20,392 - INFO - 
allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9317, LAS: 0.8756, UEM: 0.5489, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8281, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9601, loss: 0.8450, batch_reg_loss: 0.1376, reg_loss: 0.1376 ||: 4%|3 | 4/111 [00:02<01:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9439, LAS: 0.8883, UEM: 0.6418, LEM: 0.3665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3450, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7376, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||: 6%|6 | 7/111 [00:05<01:17, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9406, LAS: 0.8849, UEM: 0.5977, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9597, partial_loss/deprel_loss: 0.8677, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0238, loss: 0.7623, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||: 9%|9 | 10/111 [00:07<01:15, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9310, LAS: 0.8748, UEM: 0.5612, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5104, partial_loss/deprel_loss: 0.6686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8476, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||: 12%|#1 | 13/111 [00:09<01:12, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9147, UAS: 0.9346, LAS: 0.8790, UEM: 0.5600, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.8156, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||: 14%|#4 | 16/111 [00:12<01:10, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9323, LAS: 0.8758, UEM: 0.5203, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9130, partial_loss/deprel_loss: 0.9827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1067, loss: 0.8472, batch_reg_loss: 0.1379, reg_loss: 0.1378 ||: 18%|#8 | 20/111 [00:14<01:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9317, LAS: 0.8753, UEM: 0.4986, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8557, batch_reg_loss: 0.1380, reg_loss: 0.1378 ||: 21%|## | 23/111 [00:16<01:03, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9292, LAS: 0.8729, UEM: 0.4781, LEM: 0.2357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6835, loss: 0.8777, batch_reg_loss: 0.1381, reg_loss: 0.1378 ||: 24%|##4 | 27/111 [00:19<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9319, LAS: 0.8755, UEM: 0.5036, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5178, partial_loss/deprel_loss: 0.6325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 
0.8563, batch_reg_loss: 0.1381, reg_loss: 0.1379 ||: 28%|##7 | 31/111 [00:21<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9352, LAS: 0.8802, UEM: 0.5864, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4408, partial_loss/deprel_loss: 0.6740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7656, loss: 0.8228, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||: 31%|### | 34/111 [00:24<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9331, LAS: 0.8780, UEM: 0.5720, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.8427, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||: 33%|###3 | 37/111 [00:26<00:53, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9335, LAS: 0.8782, UEM: 0.5702, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5566, loss: 0.8412, batch_reg_loss: 0.1383, reg_loss: 0.1380 ||: 37%|###6 | 41/111 [00:29<00:48, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9335, LAS: 0.8780, UEM: 0.5642, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8098, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9969, loss: 0.8421, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||: 40%|###9 | 44/111 [00:31<00:48, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9330, LAS: 0.8774, 
UEM: 0.5605, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6040, loss: 0.8485, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||: 42%|####2 | 47/111 [00:33<00:46, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9339, LAS: 0.8782, UEM: 0.5593, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5911, loss: 0.8408, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||: 45%|####5 | 50/111 [00:35<00:43, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9330, LAS: 0.8769, UEM: 0.5442, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8073, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8503, batch_reg_loss: 0.1385, reg_loss: 0.1381 ||: 49%|####8 | 54/111 [00:38<00:39, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9338, LAS: 0.8778, UEM: 0.5522, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 0.7195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8274, loss: 0.8418, batch_reg_loss: 0.1386, reg_loss: 0.1381 ||: 51%|#####1 | 57/111 [00:40<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9322, LAS: 0.8759, UEM: 0.5406, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8303, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0005, loss: 0.8547, batch_reg_loss: 
0.1387, reg_loss: 0.1381 ||: 55%|#####4 | 61/111 [00:43<00:34, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.9314, LAS: 0.8750, UEM: 0.5303, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.9400, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0926, loss: 0.8601, batch_reg_loss: 0.1387, reg_loss: 0.1382 ||: 59%|#####8 | 65/111 [00:45<00:29, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9322, LAS: 0.8760, UEM: 0.5436, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.4120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.8483, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||: 62%|######2 | 69/111 [00:48<00:27, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9315, LAS: 0.8752, UEM: 0.5358, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7962, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.8559, batch_reg_loss: 0.1389, reg_loss: 0.1382 ||: 66%|######5 | 73/111 [00:50<00:25, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9308, LAS: 0.8746, UEM: 0.5263, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9985, partial_loss/deprel_loss: 0.9882, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8618, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||: 69%|######9 | 77/111 [00:53<00:23, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9306, LAS: 0.8743, UEM: 0.5325, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2627, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8641, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||: 73%|#######2 | 81/111 [00:56<00:21, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9309, LAS: 0.8746, UEM: 0.5345, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3698, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.8614, batch_reg_loss: 0.1391, reg_loss: 0.1383 ||: 77%|#######6 | 85/111 [00:59<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9311, LAS: 0.8748, UEM: 0.5386, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1995, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4799, loss: 0.8597, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||: 79%|#######9 | 88/111 [01:01<00:15, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7752, UAS: 0.9306, LAS: 0.8743, UEM: 0.5397, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1589, partial_loss/deprel_loss: 1.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6607, loss: 0.8631, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||: 83%|########2 | 92/111 [01:03<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9301, LAS: 0.8737, UEM: 0.5393, LEM: 0.3071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.6012, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.8662, batch_reg_loss: 0.1393, reg_loss: 0.1384 ||: 86%|########5 | 95/111 [01:06<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9305, LAS: 0.8740, UEM: 0.5404, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3724, partial_loss/deprel_loss: 0.5439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.8636, batch_reg_loss: 0.1393, reg_loss: 0.1385 ||: 88%|########8 | 98/111 [01:08<00:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8126, UAS: 0.9289, LAS: 0.8722, UEM: 0.5321, LEM: 0.3010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5588, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3808, loss: 0.8792, batch_reg_loss: 0.1394, reg_loss: 0.1385 ||: 92%|#########1| 102/111 [01:10<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9288, LAS: 0.8719, UEM: 0.5261, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6212, partial_loss/deprel_loss: 0.7073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8296, loss: 0.8832, batch_reg_loss: 0.1395, reg_loss: 0.1385 ||: 95%|#########5| 106/111 [01:13<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9283, LAS: 0.8714, UEM: 0.5235, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4445, partial_loss/deprel_loss: 1.0017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2298, loss: 0.8870, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||: 99%|#########9| 110/111 [01:16<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9286, LAS: 0.8717, UEM: 0.5255, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2913, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5934, loss: 0.8844, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||: 100%|##########| 111/111 [01:17<00:00, 1.44it/s]\n", + "2023-04-06 23:43:37,470 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9208, LAS: 0.8625, UEM: 0.4979, LEM: 0.1992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 25.0669, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1296, loss: 34.6105, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9200, LAS: 0.8624, UEM: 0.3798, LEM: 0.1298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2659, partial_loss/deprel_loss: 50.9556, partial_loss/cycle_loss: 0.0000, batch_loss: 41.0176, loss: 35.2960, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 31%|### | 4/13 [00:04<00:09, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9319, LAS: 0.8754, UEM: 0.4854, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 25.1574, partial_loss/cycle_loss: 0.0000, batch_loss: 20.2391, loss: 30.3282, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:06<00:05, 1.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9407, LAS: 0.8855, UEM: 0.6077, 
LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3743, partial_loss/deprel_loss: 26.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 21.6387, loss: 28.1431, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:04, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9435, LAS: 0.8899, UEM: 0.6518, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 31.0434, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9755, loss: 26.9689, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9423, LAS: 0.8885, UEM: 0.6328, LEM: 0.3709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9222, partial_loss/deprel_loss: 32.1733, partial_loss/cycle_loss: 0.0000, batch_loss: 25.9231, loss: 26.8884, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.05it/s]\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 
0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.494 | 32.173\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.291 | 0.922\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - reg_loss | 0.139 | 0.000\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UEM | 0.525 | 0.633\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - LAS | 0.872 | 0.888\n", + "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - loss | 0.884 | 26.888\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEM | 0.294 | 0.371\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | 0.942\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EM | 0.911 | 0.871\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:43:49,822 - INFO - combo.training.trainer - Epoch duration: 0:01:29.437908\n", + "2023-04-06 23:43:49,823 - INFO - combo.training.trainer - Estimated training time remaining: 7:53:11\n", + "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Epoch 41/399\n", + "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - GPU 0 memory 
usage: 2.4G\n", + "2023-04-06 23:43:49,829 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9473, LAS: 0.8922, UEM: 0.5747, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.8736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9877, loss: 0.7340, batch_reg_loss: 0.1397, reg_loss: 0.1396 ||: 4%|3 | 4/111 [00:02<01:06, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9386, LAS: 0.8829, UEM: 0.5009, LEM: 0.2195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8012, batch_reg_loss: 0.1397, reg_loss: 0.1397 ||: 6%|6 | 7/111 [00:04<01:06, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9384, LAS: 0.8814, UEM: 0.4792, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.8055, batch_reg_loss: 0.1398, reg_loss: 0.1397 ||: 10%|9 | 11/111 [00:07<01:05, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9380, LAS: 0.8812, UEM: 0.4718, LEM: 0.1999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.7587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8718, loss: 0.8062, batch_reg_loss: 0.1399, reg_loss: 0.1397 ||: 14%|#3 | 15/111 [00:09<01:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9369, LAS: 0.8806, UEM: 0.4850, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.5864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7066, loss: 0.8159, batch_reg_loss: 0.1399, reg_loss: 0.1398 ||: 16%|#6 | 18/111 [00:12<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9404, LAS: 0.8844, UEM: 0.5462, LEM: 0.2671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2989, partial_loss/deprel_loss: 0.4637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.7806, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||: 19%|#8 | 21/111 [00:14<01:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9405, LAS: 0.8848, UEM: 0.5380, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.7739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9132, loss: 0.7765, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||: 22%|##1 | 24/111 [00:16<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9381, LAS: 0.8821, UEM: 0.5425, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4807, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7943, batch_reg_loss: 0.1401, reg_loss: 0.1398 ||: 24%|##4 | 27/111 [00:18<01:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9360, LAS: 0.8798, UEM: 0.5291, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2766, partial_loss/deprel_loss: 
0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8113, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||: 27%|##7 | 30/111 [00:20<00:56, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9353, LAS: 0.8792, UEM: 0.5505, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0839, partial_loss/deprel_loss: 0.9513, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1179, loss: 0.8167, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||: 30%|##9 | 33/111 [00:22<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9379, LAS: 0.8819, UEM: 0.5853, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1621, partial_loss/deprel_loss: 0.4345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.7952, batch_reg_loss: 0.1402, reg_loss: 0.1399 ||: 32%|###2 | 36/111 [00:25<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9373, LAS: 0.8810, UEM: 0.5804, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 0.6910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8111, loss: 0.8015, batch_reg_loss: 0.1403, reg_loss: 0.1399 ||: 36%|###6 | 40/111 [00:27<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9365, LAS: 0.8805, UEM: 0.5882, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1602, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4219, loss: 0.8045, batch_reg_loss: 0.1403, reg_loss: 0.1400 ||: 39%|###8 | 43/111 [00:29<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9357, LAS: 0.8799, UEM: 0.5839, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0559, partial_loss/deprel_loss: 0.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0364, loss: 0.8087, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||: 41%|####1 | 46/111 [00:32<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9341, LAS: 0.8782, UEM: 0.5697, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.8229, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||: 45%|####5 | 50/111 [00:34<00:41, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9332, LAS: 0.8772, UEM: 0.5581, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9401, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0405, loss: 0.8303, batch_reg_loss: 0.1405, reg_loss: 0.1401 ||: 48%|####7 | 53/111 [00:36<00:39, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9313, LAS: 0.8754, UEM: 0.5553, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7602, partial_loss/deprel_loss: 0.7644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9042, loss: 0.8451, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9299, LAS: 0.8736, UEM: 0.5401, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6608, partial_loss/deprel_loss: 0.7292, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8562, loss: 0.8595, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9297, LAS: 0.8732, UEM: 0.5341, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2914, partial_loss/deprel_loss: 0.9993, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1984, loss: 0.8635, batch_reg_loss: 0.1407, reg_loss: 0.1401 ||: 57%|#####6 | 63/111 [00:43<00:33, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9302, LAS: 0.8736, UEM: 0.5320, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3977, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.8592, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||: 59%|#####9 | 66/111 [00:45<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9306, LAS: 0.8740, UEM: 0.5362, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5458, partial_loss/deprel_loss: 0.6075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8557, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||: 63%|######3 | 70/111 [00:48<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9305, LAS: 0.8737, UEM: 0.5287, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.8577, batch_reg_loss: 0.1409, reg_loss: 0.1402 ||: 67%|######6 | 74/111 [00:50<00:24, 
1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9301, LAS: 0.8732, UEM: 0.5233, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6254, partial_loss/deprel_loss: 0.8169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9195, loss: 0.8652, batch_reg_loss: 0.1410, reg_loss: 0.1403 ||: 70%|####### | 78/111 [00:53<00:21, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9296, LAS: 0.8724, UEM: 0.5124, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8604, partial_loss/deprel_loss: 0.7997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9529, loss: 0.8711, batch_reg_loss: 0.1411, reg_loss: 0.1403 ||: 74%|#######3 | 82/111 [00:56<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.9287, LAS: 0.8713, UEM: 0.5086, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6232, partial_loss/deprel_loss: 1.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4060, loss: 0.8803, batch_reg_loss: 0.1411, reg_loss: 0.1404 ||: 77%|#######7 | 86/111 [00:58<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9289, LAS: 0.8716, UEM: 0.5090, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0425, loss: 0.8771, batch_reg_loss: 0.1412, reg_loss: 0.1404 ||: 81%|########1 | 90/111 [01:01<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9291, LAS: 0.8718, UEM: 0.5114, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.2032, partial_loss/deprel_loss: 1.0468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2193, loss: 0.8760, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||: 84%|########3 | 93/111 [01:05<00:15, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9303, LAS: 0.8733, UEM: 0.5341, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0761, partial_loss/deprel_loss: 0.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2968, loss: 0.8647, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||: 86%|########6 | 96/111 [01:08<00:12, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9304, LAS: 0.8733, UEM: 0.5303, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4572, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8644, batch_reg_loss: 0.1414, reg_loss: 0.1405 ||: 90%|######### | 100/111 [01:10<00:08, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7828, UAS: 0.9302, LAS: 0.8732, UEM: 0.5366, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0178, partial_loss/deprel_loss: 1.2750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5650, loss: 0.8644, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||: 93%|#########2| 103/111 [01:12<00:06, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.9297, LAS: 0.8725, UEM: 0.5303, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2271, partial_loss/deprel_loss: 0.9879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1772, loss: 0.8693, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||: 96%|#########6| 
107/111 [01:15<00:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.133 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - 
combo.training.tensorboard_writer - partial_loss/head_loss | 1.526 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - reg_loss | 0.141 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UEM | 0.525 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LAS | 0.871 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - loss | 0.877 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEM | 0.292 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EM | 0.808 | N/A\n", + "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Epoch duration: 0:01:17.811230\n", + "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Estimated training time remaining: 7:51:41\n", + "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Epoch 42/399\n", + "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:45:07,635 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:45:07,641 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9418, LAS: 0.8844, UEM: 0.6837, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1491, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.7424, batch_reg_loss: 0.1416, reg_loss: 0.1416 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9439, LAS: 0.8897, UEM: 0.6355, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.5091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6237, loss: 0.7500, batch_reg_loss: 0.1417, reg_loss: 0.1416 ||: 6%|6 | 7/111 [00:04<01:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9345, LAS: 0.8808, UEM: 0.5993, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8176, partial_loss/deprel_loss: 1.0696, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3609, loss: 0.8223, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||: 9%|9 | 10/111 [00:06<01:10, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9321, LAS: 0.8780, UEM: 0.5473, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9754, partial_loss/deprel_loss: 0.9375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0869, loss: 0.8430, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||: 12%|#1 | 13/111 [00:09<01:11, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9290, LAS: 0.8745, UEM: 0.5006, LEM: 0.2696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9098, partial_loss/deprel_loss: 0.8706, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.0203, loss: 0.8699, batch_reg_loss: 0.1419, reg_loss: 0.1417 ||: 14%|#4 | 16/111 [00:11<01:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7885, UAS: 0.9225, LAS: 0.8667, UEM: 0.4693, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9202, partial_loss/deprel_loss: 1.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5509, loss: 0.9321, batch_reg_loss: 0.1419, reg_loss: 0.1418 ||: 17%|#7 | 19/111 [00:13<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9252, LAS: 0.8689, UEM: 0.4885, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2645, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.9091, batch_reg_loss: 0.1420, reg_loss: 0.1418 ||: 20%|#9 | 22/111 [00:15<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7888, UAS: 0.9224, LAS: 0.8653, UEM: 0.4605, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7105, partial_loss/deprel_loss: 1.1578, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4104, loss: 0.9309, batch_reg_loss: 0.1421, reg_loss: 0.1418 ||: 23%|##3 | 26/111 [00:18<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9242, LAS: 0.8673, UEM: 0.4631, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6195, partial_loss/deprel_loss: 0.7172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8398, loss: 0.9185, batch_reg_loss: 0.1421, reg_loss: 0.1419 ||: 27%|##7 | 30/111 [00:20<00:54, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9257, LAS: 
0.8693, UEM: 0.4708, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4584, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6584, loss: 0.9047, batch_reg_loss: 0.1422, reg_loss: 0.1419 ||: 31%|### | 34/111 [00:22<00:49, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9266, LAS: 0.8708, UEM: 0.5190, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5656, partial_loss/deprel_loss: 1.1580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3818, loss: 0.8919, batch_reg_loss: 0.1423, reg_loss: 0.1419 ||: 34%|###4 | 38/111 [00:25<00:47, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9268, LAS: 0.8702, UEM: 0.5255, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6049, partial_loss/deprel_loss: 1.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4239, loss: 0.8945, batch_reg_loss: 0.1424, reg_loss: 0.1420 ||: 38%|###7 | 42/111 [00:28<00:44, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9244, LAS: 0.8681, UEM: 0.5113, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5069, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7131, loss: 0.9143, batch_reg_loss: 0.1425, reg_loss: 0.1420 ||: 41%|####1 | 46/111 [00:30<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9260, LAS: 0.8699, UEM: 0.5146, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9033, partial_loss/deprel_loss: 0.9612, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0922, loss: 0.9012, 
batch_reg_loss: 0.1425, reg_loss: 0.1421 ||: 45%|####5 | 50/111 [00:33<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9262, LAS: 0.8700, UEM: 0.5082, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.5459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6573, loss: 0.8964, batch_reg_loss: 0.1426, reg_loss: 0.1421 ||: 48%|####7 | 53/111 [00:35<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9264, LAS: 0.8700, UEM: 0.5088, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2628, partial_loss/deprel_loss: 0.4712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5722, loss: 0.8967, batch_reg_loss: 0.1427, reg_loss: 0.1421 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9269, LAS: 0.8703, UEM: 0.5012, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8432, partial_loss/deprel_loss: 0.8230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9697, loss: 0.8934, batch_reg_loss: 0.1427, reg_loss: 0.1422 ||: 54%|#####4 | 60/111 [00:40<00:33, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9261, LAS: 0.8694, UEM: 0.4960, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.9014, batch_reg_loss: 0.1428, reg_loss: 0.1422 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9270, LAS: 0.8702, 
UEM: 0.5018, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4418, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.8965, batch_reg_loss: 0.1429, reg_loss: 0.1422 ||: 61%|######1 | 68/111 [00:45<00:29, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9281, LAS: 0.8715, UEM: 0.5132, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3822, partial_loss/deprel_loss: 0.5883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.8848, batch_reg_loss: 0.1429, reg_loss: 0.1423 ||: 64%|######3 | 71/111 [00:47<00:27, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9280, LAS: 0.8712, UEM: 0.5081, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 0.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.8869, batch_reg_loss: 0.1430, reg_loss: 0.1423 ||: 68%|######7 | 75/111 [00:50<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9281, LAS: 0.8714, UEM: 0.5251, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4009, partial_loss/deprel_loss: 1.1302, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3274, loss: 0.8879, batch_reg_loss: 0.1431, reg_loss: 0.1423 ||: 71%|#######1 | 79/111 [00:53<00:21, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8092, UAS: 0.9276, LAS: 0.8707, UEM: 0.5240, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5534, partial_loss/deprel_loss: 1.0782, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.3164, loss: 0.8904, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||: 75%|#######4 | 83/111 [00:55<00:18, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9264, LAS: 0.8695, UEM: 0.5132, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9556, loss: 0.9018, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||: 78%|#######8 | 87/111 [00:58<00:15, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9264, LAS: 0.8696, UEM: 0.5124, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.9021, batch_reg_loss: 0.1433, reg_loss: 0.1425 ||: 82%|########1 | 91/111 [01:00<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9273, LAS: 0.8706, UEM: 0.5229, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.8934, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||: 86%|########5 | 95/111 [01:04<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9280, LAS: 0.8714, UEM: 0.5268, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.6957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.8872, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||: 88%|########8 | 98/111 [01:06<00:09, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8226, UAS: 0.9276, LAS: 0.8709, UEM: 0.5227, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2476, partial_loss/deprel_loss: 1.0486, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2319, loss: 0.8905, batch_reg_loss: 0.1435, reg_loss: 0.1425 ||: 91%|######### | 101/111 [01:08<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.9276, LAS: 0.8708, UEM: 0.5191, LEM: 0.2894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2091, partial_loss/deprel_loss: 0.9989, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1845, loss: 0.8903, batch_reg_loss: 0.1435, reg_loss: 0.1426 ||: 94%|#########3| 104/111 [01:10<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9281, LAS: 0.8713, UEM: 0.5172, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3627, partial_loss/deprel_loss: 0.5546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8854, batch_reg_loss: 0.1436, reg_loss: 0.1426 ||: 97%|#########7| 108/111 [01:12<00:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9289, LAS: 0.8721, UEM: 0.5273, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1537, partial_loss/deprel_loss: 0.3458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4510, loss: 0.8789, batch_reg_loss: 0.1437, reg_loss: 0.1426 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:46:23,087 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - 
combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.346 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.154 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - reg_loss | 0.143 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UEM | 0.527 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LAS | 0.872 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - loss | 0.879 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LEM | 0.295 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EM | 0.923 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - 
combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:46:23,089 - INFO - combo.training.trainer - Epoch duration: 0:01:15.455331\n", + "2023-04-06 23:46:23,090 - INFO - combo.training.trainer - Estimated training time remaining: 7:49:52\n", + "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Epoch 43/399\n", + "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:46:23,096 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9428, LAS: 0.8899, UEM: 0.5301, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7088, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8902, loss: 0.7165, batch_reg_loss: 0.1437, reg_loss: 0.1437 ||: 4%|3 | 4/111 [00:02<01:12, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9305, LAS: 0.8755, UEM: 0.4153, LEM: 0.2112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9663, partial_loss/deprel_loss: 0.8616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0263, loss: 0.8579, batch_reg_loss: 0.1438, reg_loss: 0.1437 ||: 6%|6 | 7/111 [00:04<01:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9267, LAS: 0.8695, UEM: 0.3652, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7665, loss: 0.8932, batch_reg_loss: 0.1438, reg_loss: 0.1438 
||: 10%|9 | 11/111 [00:07<01:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9308, LAS: 0.8744, UEM: 0.4503, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5104, loss: 0.8467, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||: 13%|#2 | 14/111 [00:09<01:07, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9310, LAS: 0.8749, UEM: 0.4808, LEM: 0.2451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6832, loss: 0.8372, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||: 15%|#5 | 17/111 [00:11<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9305, LAS: 0.8744, UEM: 0.4984, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.4246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5237, loss: 0.8381, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||: 18%|#8 | 20/111 [00:14<01:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9311, LAS: 0.8754, UEM: 0.4955, LEM: 0.2494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4113, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6570, loss: 0.8374, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||: 21%|## | 23/111 [00:16<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9299, LAS: 0.8747, UEM: 0.5014, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0566, partial_loss/deprel_loss: 0.9292, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8457, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9280, LAS: 0.8729, UEM: 0.4755, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7893, partial_loss/deprel_loss: 0.7554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9063, loss: 0.8606, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||: 27%|##7 | 30/111 [00:20<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9309, LAS: 0.8757, UEM: 0.4968, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.7238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.8412, batch_reg_loss: 0.1442, reg_loss: 0.1439 ||: 31%|### | 34/111 [00:23<00:50, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8741, UEM: 0.4825, LEM: 0.2462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4805, partial_loss/deprel_loss: 0.6438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7554, loss: 0.8578, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||: 33%|###3 | 37/111 [00:25<00:49, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9296, LAS: 0.8747, UEM: 0.5280, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0719, partial_loss/deprel_loss: 0.1706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2952, loss: 0.8560, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||: 36%|###6 | 40/111 [00:27<00:49, 
1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8147, UAS: 0.9272, LAS: 0.8719, UEM: 0.5142, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.0491, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2657, loss: 0.8769, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||: 39%|###8 | 43/111 [00:29<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9253, LAS: 0.8700, UEM: 0.5011, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.8194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9620, loss: 0.8908, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||: 41%|####1 | 46/111 [00:31<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9264, LAS: 0.8710, UEM: 0.5009, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.8833, batch_reg_loss: 0.1445, reg_loss: 0.1441 ||: 44%|####4 | 49/111 [00:33<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9273, LAS: 0.8721, UEM: 0.5077, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4123, partial_loss/deprel_loss: 0.5633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.8738, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||: 48%|####7 | 53/111 [00:36<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9277, LAS: 0.8724, UEM: 0.5111, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6128, loss: 0.8723, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9271, LAS: 0.8720, UEM: 0.5031, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6218, loss: 0.8758, batch_reg_loss: 0.1447, reg_loss: 0.1442 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9282, LAS: 0.8732, UEM: 0.5039, LEM: 0.2799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.8675, batch_reg_loss: 0.1448, reg_loss: 0.1442 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9280, LAS: 0.8729, UEM: 0.5005, LEM: 0.2765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7839, partial_loss/deprel_loss: 0.7660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.8710, batch_reg_loss: 0.1449, reg_loss: 0.1442 ||: 61%|######1 | 68/111 [00:46<00:27, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9287, LAS: 0.8736, UEM: 0.4970, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4859, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7367, loss: 0.8662, batch_reg_loss: 0.1449, 
reg_loss: 0.1443 ||: 65%|######4 | 72/111 [00:48<00:23, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8157, UAS: 0.9272, LAS: 0.8720, UEM: 0.4943, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5636, partial_loss/deprel_loss: 1.0879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3280, loss: 0.8815, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||: 68%|######8 | 76/111 [00:50<00:21, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8144, UAS: 0.9269, LAS: 0.8717, UEM: 0.5034, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5043, partial_loss/deprel_loss: 1.1348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3537, loss: 0.8843, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||: 72%|#######2 | 80/111 [00:53<00:18, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9266, LAS: 0.8709, UEM: 0.4931, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7594, partial_loss/deprel_loss: 0.8771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.8908, batch_reg_loss: 0.1451, reg_loss: 0.1444 ||: 76%|#######5 | 84/111 [00:55<00:16, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9272, LAS: 0.8716, UEM: 0.5056, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8835, batch_reg_loss: 0.1452, reg_loss: 0.1444 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9283, LAS: 0.8730, UEM: 0.5235, 
LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4175, loss: 0.8710, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||: 83%|########2 | 92/111 [01:01<00:13, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9284, LAS: 0.8731, UEM: 0.5205, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4851, partial_loss/deprel_loss: 0.6839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8712, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||: 86%|########6 | 96/111 [01:04<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9279, LAS: 0.8724, UEM: 0.5209, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1321, partial_loss/deprel_loss: 1.0463, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8762, batch_reg_loss: 0.1454, reg_loss: 0.1445 ||: 90%|######### | 100/111 [01:06<00:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9277, LAS: 0.8722, UEM: 0.5211, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6545, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8775, batch_reg_loss: 0.1455, reg_loss: 0.1446 ||: 94%|#########3| 104/111 [01:09<00:04, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9282, LAS: 0.8725, UEM: 0.5207, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.8751, 
batch_reg_loss: 0.1455, reg_loss: 0.1446 ||: 97%|#########7| 108/111 [01:11<00:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7823, UAS: 0.9278, LAS: 0.8719, UEM: 0.5203, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0270, partial_loss/deprel_loss: 1.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5918, loss: 0.8791, batch_reg_loss: 0.1456, reg_loss: 0.1446 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.301 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 2.027 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - reg_loss | 0.145 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UEM | 0.520 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LAS | 0.872 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - 
combo.training.tensorboard_writer - loss | 0.879 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEM | 0.292 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UAS | 0.928 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EM | 0.782 | N/A\n", + "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Epoch duration: 0:01:14.097322\n", + "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Estimated training time remaining: 7:47:54\n", + "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Epoch 44/399\n", + "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:47:37,188 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:47:37,194 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9630, LAS: 0.9171, UEM: 0.7763, LEM: 0.5258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.5429, batch_reg_loss: 0.1456, reg_loss: 0.1456 ||: 3%|2 | 3/111 [00:02<01:23, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9468, LAS: 0.8951, UEM: 0.6389, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5384, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.7117, batch_reg_loss: 0.1457, reg_loss: 0.1456 ||: 6%|6 | 7/111 [00:04<01:16, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9520, LAS: 0.9005, UEM: 0.6665, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4527, partial_loss/deprel_loss: 0.5690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6915, loss: 0.6676, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||: 10%|9 | 11/111 [00:07<01:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9398, LAS: 0.8874, UEM: 0.6268, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8417, partial_loss/deprel_loss: 1.2189, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4893, loss: 0.7801, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||: 13%|#2 | 14/111 [00:09<01:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9389, LAS: 0.8862, UEM: 0.6093, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6420, partial_loss/deprel_loss: 0.6886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8252, loss: 0.7783, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||: 15%|#5 | 17/111 [00:11<01:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9394, LAS: 0.8866, UEM: 0.6067, LEM: 0.3482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4438, partial_loss/deprel_loss: 0.6601, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7781, batch_reg_loss: 0.1459, reg_loss: 0.1457 ||: 18%|#8 | 20/111 [00:13<01:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8509, UAS: 0.9330, LAS: 0.8786, UEM: 0.5653, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9093, partial_loss/deprel_loss: 0.8832, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0344, loss: 0.8428, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||: 22%|##1 | 24/111 [00:16<00:59, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7874, UAS: 0.9295, LAS: 0.8749, UEM: 0.5659, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0483, partial_loss/deprel_loss: 1.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5104, loss: 0.8740, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||: 25%|##5 | 28/111 [00:18<00:56, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9314, LAS: 0.8773, UEM: 0.5799, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8907, loss: 0.8550, batch_reg_loss: 0.1461, reg_loss: 0.1458 ||: 28%|##7 | 31/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9303, LAS: 0.8762, UEM: 0.5832, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4871, partial_loss/deprel_loss: 0.5664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8632, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||: 32%|###1 | 35/111 [00:23<00:51, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9297, LAS: 0.8753, UEM: 0.5582, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6452, partial_loss/deprel_loss: 0.7188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8503, loss: 0.8698, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||: 35%|###5 | 39/111 [00:26<00:48, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9305, LAS: 0.8756, UEM: 0.5537, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7213, partial_loss/deprel_loss: 0.7833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8642, batch_reg_loss: 0.1463, reg_loss: 0.1459 ||: 38%|###7 | 42/111 [00:28<00:47, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9290, LAS: 0.8735, UEM: 0.5410, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0237, partial_loss/deprel_loss: 0.8837, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0581, loss: 0.8770, batch_reg_loss: 0.1464, reg_loss: 0.1460 ||: 41%|####1 | 46/111 [00:30<00:43, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9317, LAS: 0.8768, UEM: 0.5692, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6319, loss: 0.8508, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||: 45%|####5 | 50/111 [00:33<00:40, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9321, LAS: 0.8772, UEM: 0.5601, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5211, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.7556, loss: 0.8474, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||: 49%|####8 | 54/111 [00:36<00:37, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9311, LAS: 0.8759, UEM: 0.5516, LEM: 0.3082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7685, loss: 0.8563, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||: 52%|#####2 | 58/111 [00:38<00:35, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.9310, LAS: 0.8758, UEM: 0.5487, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4201, partial_loss/deprel_loss: 1.0710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2874, loss: 0.8568, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||: 56%|#####5 | 62/111 [00:41<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9310, LAS: 0.8756, UEM: 0.5411, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8429, loss: 0.8575, batch_reg_loss: 0.1467, reg_loss: 0.1461 ||: 59%|#####8 | 65/111 [00:43<00:32, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9304, LAS: 0.8748, UEM: 0.5300, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8484, partial_loss/deprel_loss: 0.8227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8617, batch_reg_loss: 0.1467, reg_loss: 0.1462 ||: 61%|######1 | 68/111 [00:46<00:29, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9297, LAS: 0.8742, UEM: 0.5247, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5040, partial_loss/deprel_loss: 0.5522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.8663, batch_reg_loss: 0.1468, reg_loss: 0.1462 ||: 65%|######4 | 72/111 [00:48<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9296, LAS: 0.8740, UEM: 0.5207, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.5267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.8694, batch_reg_loss: 0.1469, reg_loss: 0.1462 ||: 68%|######8 | 76/111 [00:51<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9301, LAS: 0.8746, UEM: 0.5239, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4784, partial_loss/deprel_loss: 0.6309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7473, loss: 0.8649, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||: 72%|#######2 | 80/111 [00:53<00:20, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9295, LAS: 0.8739, UEM: 0.5156, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8536, partial_loss/deprel_loss: 0.8270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9793, loss: 0.8710, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||: 76%|#######5 | 84/111 [00:56<00:17, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9279, LAS: 0.8721, UEM: 0.5087, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
1.1010, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0984, loss: 0.8855, batch_reg_loss: 0.1471, reg_loss: 0.1463 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9283, LAS: 0.8724, UEM: 0.5060, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7206, partial_loss/deprel_loss: 0.8822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9970, loss: 0.8843, batch_reg_loss: 0.1472, reg_loss: 0.1464 ||: 83%|########2 | 92/111 [01:01<00:11, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9280, LAS: 0.8721, UEM: 0.5019, LEM: 0.2653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9525, partial_loss/deprel_loss: 0.8787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0407, loss: 0.8880, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||: 86%|########6 | 96/111 [01:03<00:09, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9288, LAS: 0.8728, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0723, partial_loss/deprel_loss: 0.2095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3294, loss: 0.8826, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||: 90%|######### | 100/111 [01:07<00:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9286, LAS: 0.8726, UEM: 0.5207, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3335, partial_loss/deprel_loss: 1.0984, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2928, loss: 0.8856, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||: 93%|#########2| 103/111 [01:09<00:05, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9291, LAS: 0.8730, UEM: 0.5236, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7942, loss: 0.8808, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||: 95%|#########5| 106/111 [01:11<00:03, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9294, LAS: 0.8734, UEM: 0.5320, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1479, partial_loss/deprel_loss: 0.2737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3960, loss: 0.8765, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||: 98%|#########8| 109/111 [01:13<00:01, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9296, LAS: 0.8735, UEM: 0.5301, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.8758, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||: 100%|##########| 111/111 [01:15<00:00, 1.48it/s]\n", + "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - 
combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.803 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.636 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - reg_loss | 0.147 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UEM | 0.530 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LAS | 0.873 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - loss | 0.876 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LEM | 0.297 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EM | 0.877 | N/A\n", + "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Epoch duration: 0:01:15.138417\n", + "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:06\n", + "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - Epoch 45/399\n", + "2023-04-06 23:48:52,326 - INFO - 
allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:48:52,334 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9169, LAS: 0.8645, UEM: 0.6209, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3488, partial_loss/deprel_loss: 0.4880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6077, loss: 0.9611, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||: 4%|3 | 4/111 [00:02<01:17, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9205, LAS: 0.8661, UEM: 0.6082, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7394, partial_loss/deprel_loss: 1.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4749, loss: 0.9431, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||: 6%|6 | 7/111 [00:05<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9206, LAS: 0.8646, UEM: 0.5249, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9024, loss: 0.9411, batch_reg_loss: 0.1477, reg_loss: 0.1476 ||: 10%|9 | 11/111 [00:07<01:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9248, LAS: 0.8690, UEM: 0.5142, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.7006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 0.8999, 
batch_reg_loss: 0.1478, reg_loss: 0.1476 ||: 13%|#2 | 14/111 [00:09<01:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9275, LAS: 0.8721, UEM: 0.5363, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.8710, batch_reg_loss: 0.1478, reg_loss: 0.1477 ||: 15%|#5 | 17/111 [00:11<01:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9285, LAS: 0.8730, UEM: 0.5128, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.6489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8690, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||: 18%|#8 | 20/111 [00:13<01:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9269, LAS: 0.8713, UEM: 0.4956, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9929, partial_loss/deprel_loss: 0.9136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0774, loss: 0.8785, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||: 21%|## | 23/111 [00:15<01:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9277, LAS: 0.8720, UEM: 0.4875, LEM: 0.2508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7347, partial_loss/deprel_loss: 0.7592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9022, loss: 0.8687, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9321, LAS: 0.8777, UEM: 0.5737, LEM: 
0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.5158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6243, loss: 0.8307, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||: 26%|##6 | 29/111 [00:21<01:05, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9321, LAS: 0.8777, UEM: 0.5882, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.5867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7080, loss: 0.8318, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||: 30%|##9 | 33/111 [00:23<00:58, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9305, LAS: 0.8756, UEM: 0.5741, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9509, loss: 0.8478, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||: 32%|###2 | 36/111 [00:25<00:54, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9317, LAS: 0.8763, UEM: 0.5771, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 0.8313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.8396, batch_reg_loss: 0.1482, reg_loss: 0.1479 ||: 35%|###5 | 39/111 [00:27<00:52, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9338, LAS: 0.8790, UEM: 0.5864, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3781, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6742, loss: 0.8236, batch_reg_loss: 0.1482, reg_loss: 0.1479 
||: 39%|###8 | 43/111 [00:30<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9320, LAS: 0.8768, UEM: 0.5703, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1642, partial_loss/deprel_loss: 0.9447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1368, loss: 0.8393, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||: 41%|####1 | 46/111 [00:32<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9331, LAS: 0.8779, UEM: 0.5812, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4418, loss: 0.8277, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||: 44%|####4 | 49/111 [00:34<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9328, LAS: 0.8772, UEM: 0.5853, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1467, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4954, loss: 0.8332, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||: 47%|####6 | 52/111 [00:36<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9322, LAS: 0.8766, UEM: 0.5773, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2362, partial_loss/deprel_loss: 0.9801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1798, loss: 0.8400, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||: 50%|####9 | 55/111 [00:38<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9298, LAS: 0.8743, UEM: 0.5684, LEM: 0.3423, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3632, partial_loss/deprel_loss: 0.4450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5771, loss: 0.8590, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||: 53%|#####3 | 59/111 [00:41<00:37, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9287, LAS: 0.8731, UEM: 0.5648, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8692, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||: 56%|#####5 | 62/111 [00:44<00:35, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9284, LAS: 0.8725, UEM: 0.5539, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2580, partial_loss/deprel_loss: 1.0314, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2254, loss: 0.8760, batch_reg_loss: 0.1486, reg_loss: 0.1481 ||: 59%|#####9 | 66/111 [00:46<00:31, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9278, LAS: 0.8719, UEM: 0.5486, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4298, partial_loss/deprel_loss: 0.9430, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1891, loss: 0.8808, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||: 62%|######2 | 69/111 [00:48<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9270, LAS: 0.8709, UEM: 0.5420, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6441, partial_loss/deprel_loss: 0.6258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7782, 
loss: 0.8877, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||: 65%|######4 | 72/111 [00:50<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9276, LAS: 0.8713, UEM: 0.5411, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4335, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7481, loss: 0.8853, batch_reg_loss: 0.1488, reg_loss: 0.1482 ||: 68%|######8 | 76/111 [00:53<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8540, UAS: 0.9268, LAS: 0.8706, UEM: 0.5445, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9930, loss: 0.8901, batch_reg_loss: 0.1489, reg_loss: 0.1482 ||: 71%|#######1 | 79/111 [00:55<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9272, LAS: 0.8709, UEM: 0.5434, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.8875, batch_reg_loss: 0.1490, reg_loss: 0.1482 ||: 74%|#######3 | 82/111 [00:58<00:21, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9271, LAS: 0.8708, UEM: 0.5359, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1788, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1667, loss: 0.8887, batch_reg_loss: 0.1490, reg_loss: 0.1483 ||: 77%|#######7 | 86/111 [01:00<00:17, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, 
UAS: 0.9264, LAS: 0.8700, UEM: 0.5294, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1285, partial_loss/deprel_loss: 1.1447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2905, loss: 0.8945, batch_reg_loss: 0.1491, reg_loss: 0.1483 ||: 81%|########1 | 90/111 [01:02<00:13, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9266, LAS: 0.8703, UEM: 0.5230, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9470, partial_loss/deprel_loss: 0.7802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9627, loss: 0.8945, batch_reg_loss: 0.1492, reg_loss: 0.1483 ||: 85%|########4 | 94/111 [01:05<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9273, LAS: 0.8712, UEM: 0.5234, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2959, partial_loss/deprel_loss: 0.5120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6180, loss: 0.8880, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||: 88%|########8 | 98/111 [01:07<00:08, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9275, LAS: 0.8714, UEM: 0.5286, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2757, partial_loss/deprel_loss: 0.9351, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8843, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||: 92%|#########1| 102/111 [01:10<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9280, LAS: 0.8719, UEM: 0.5266, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.5887, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7234, loss: 0.8805, batch_reg_loss: 0.1494, reg_loss: 0.1484 ||: 95%|#########5| 106/111 [01:13<00:03, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8724, UEM: 0.5281, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6144, loss: 0.8774, batch_reg_loss: 0.1494, reg_loss: 0.1485 ||: 99%|#########9| 110/111 [01:16<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9282, LAS: 0.8720, UEM: 0.5259, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1604, partial_loss/deprel_loss: 1.0838, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8807, batch_reg_loss: 0.1495, reg_loss: 0.1485 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-06 23:50:09,062 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9534, LAS: 0.9001, UEM: 0.6753, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 23.7693, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0518, loss: 22.2928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9487, LAS: 0.8920, UEM: 0.6040, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 37.4935, partial_loss/cycle_loss: 0.0000, batch_loss: 30.1930, loss: 23.5104, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 
[00:05<00:06, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9415, LAS: 0.8858, UEM: 0.5706, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 31.2307, partial_loss/cycle_loss: 0.0000, batch_loss: 25.1649, loss: 25.3184, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:07<00:03, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9419, LAS: 0.8882, UEM: 0.6289, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 20.7598, partial_loss/cycle_loss: 0.0000, batch_loss: 16.6462, loss: 25.8303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:09<00:01, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00, 1.09it/s]\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELEM | 
0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.084 | 43.748\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.160 | 1.059\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - reg_loss | 0.148 | 0.000\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UEM | 0.526 | 0.623\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - LAS | 0.872 | 0.888\n", + "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - loss | 0.881 | 26.207\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEM | 0.296 | 0.363\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - UAS | 0.928 | 0.942\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:50:21,017 - INFO - 
combo.training.tensorboard_writer - EM | 0.828 | 0.868\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:50:21,017 - INFO - combo.training.trainer - Epoch duration: 0:01:28.691575\n", + "2023-04-06 23:50:21,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:03\n", + "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Epoch 46/399\n", + "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:50:21,024 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9393, LAS: 0.8848, UEM: 0.7867, LEM: 0.5840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1217, partial_loss/deprel_loss: 0.2555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3782, loss: 0.7494, batch_reg_loss: 0.1495, reg_loss: 0.1495 ||: 3%|2 | 3/111 [00:02<01:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8622, UAS: 0.9277, LAS: 0.8710, UEM: 0.5986, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7870, partial_loss/deprel_loss: 0.9187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8931, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||: 6%|6 | 7/111 [00:04<01:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9300, LAS: 0.8734, UEM: 0.5550, LEM: 0.3467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.5726, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.8855, batch_reg_loss: 0.1496, reg_loss: 0.1496 ||: 10%|9 | 11/111 [00:06<01:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9345, LAS: 0.8780, UEM: 0.5825, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.8413, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||: 13%|#2 | 14/111 [00:08<01:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9332, LAS: 0.8768, UEM: 0.5385, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9611, partial_loss/deprel_loss: 0.9256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0825, loss: 0.8551, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||: 16%|#6 | 18/111 [00:11<01:00, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9320, LAS: 0.8767, UEM: 0.5975, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0807, partial_loss/deprel_loss: 0.1996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3256, loss: 0.8484, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||: 20%|#9 | 22/111 [00:14<01:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9341, LAS: 0.8794, UEM: 0.5979, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4832, partial_loss/deprel_loss: 0.6899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.8280, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||: 23%|##2 | 25/111 [00:16<00:58, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9348, LAS: 0.8796, UEM: 0.5840, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3874, partial_loss/deprel_loss: 0.6064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.8244, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||: 26%|##6 | 29/111 [00:19<00:55, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9347, LAS: 0.8794, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5306, partial_loss/deprel_loss: 0.5927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7302, loss: 0.8259, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||: 29%|##8 | 32/111 [00:21<00:53, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8763, UEM: 0.5530, LEM: 0.3312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5293, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7681, loss: 0.8487, batch_reg_loss: 0.1500, reg_loss: 0.1498 ||: 32%|###2 | 36/111 [00:23<00:49, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9328, LAS: 0.8771, UEM: 0.5633, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1378, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4359, loss: 0.8430, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||: 35%|###5 | 39/111 [00:25<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9319, LAS: 0.8759, UEM: 0.5512, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.6162, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7192, loss: 0.8529, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||: 39%|###8 | 43/111 [00:28<00:45, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9323, LAS: 0.8762, UEM: 0.5401, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4595, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6904, loss: 0.8498, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||: 42%|####2 | 47/111 [00:30<00:41, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9327, LAS: 0.8767, UEM: 0.5498, LEM: 0.3266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0265, partial_loss/deprel_loss: 0.8848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0634, loss: 0.8436, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||: 46%|####5 | 51/111 [00:33<00:38, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9336, LAS: 0.8777, UEM: 0.5578, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9532, partial_loss/deprel_loss: 0.9401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0931, loss: 0.8347, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||: 50%|####9 | 55/111 [00:35<00:35, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8091, UAS: 0.9310, LAS: 0.8748, UEM: 0.5446, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6452, partial_loss/deprel_loss: 1.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3576, loss: 0.8591, batch_reg_loss: 0.1504, reg_loss: 0.1499 ||: 53%|#####3 | 59/111 [00:38<00:32, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8873, UAS: 0.9295, LAS: 0.8733, UEM: 0.5337, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.6523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7787, loss: 0.8732, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||: 57%|#####6 | 63/111 [00:40<00:30, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9297, LAS: 0.8738, UEM: 0.5323, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 0.4510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5713, loss: 0.8672, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||: 60%|###### | 67/111 [00:43<00:28, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9302, LAS: 0.8744, UEM: 0.5323, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.8616, batch_reg_loss: 0.1506, reg_loss: 0.1500 ||: 64%|######3 | 71/111 [00:46<00:26, 1.51it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9310, LAS: 0.8752, UEM: 0.5322, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.6015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.8551, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||: 68%|######7 | 75/111 [00:49<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9300, LAS: 0.8740, UEM: 0.5275, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3972, 
partial_loss/deprel_loss: 0.5661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.8679, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||: 71%|#######1 | 79/111 [00:51<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9278, LAS: 0.8714, UEM: 0.5172, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6741, partial_loss/deprel_loss: 1.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4435, loss: 0.8901, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||: 75%|#######4 | 83/111 [00:54<00:18, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9281, LAS: 0.8717, UEM: 0.5223, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3916, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.8872, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||: 78%|#######8 | 87/111 [00:57<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9278, LAS: 0.8714, UEM: 0.5150, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.8900, batch_reg_loss: 0.1510, reg_loss: 0.1502 ||: 82%|########1 | 91/111 [00:59<00:13, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9279, LAS: 0.8717, UEM: 0.5151, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3055, partial_loss/deprel_loss: 0.9726, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1902, loss: 0.8875, batch_reg_loss: 0.1511, reg_loss: 0.1502 ||: 86%|########5 | 95/111 [01:01<00:10, 1.57it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9284, LAS: 0.8722, UEM: 0.5175, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1813, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5253, loss: 0.8842, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||: 89%|########9 | 99/111 [01:04<00:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9288, LAS: 0.8727, UEM: 0.5197, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.8797, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||: 93%|#########2| 103/111 [01:07<00:05, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7736, UAS: 0.9286, LAS: 0.8725, UEM: 0.5249, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1080, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6937, loss: 0.8808, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||: 96%|#########6| 107/111 [01:10<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9285, LAS: 0.8723, UEM: 0.5211, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4362, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6656, loss: 0.8816, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||: 99%|#########9| 110/111 [01:12<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9286, LAS: 0.8724, UEM: 0.5211, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5446, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7395, loss: 0.8803, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.599 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.545 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - reg_loss | 0.150 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - UEM | 0.521 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LAS | 0.872 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - loss | 0.880 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LEM | 0.294 | N/A\n", + "2023-04-06 23:51:34,484 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EM | 0.890 | N/A\n", + "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Epoch duration: 0:01:13.468063\n", + "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Estimated training time remaining: 7:44:03\n", + "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Epoch 47/399\n", + "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:51:34,487 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:51:34,497 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9484, LAS: 0.8921, UEM: 0.5152, LEM: 0.2265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7989, loss: 0.7461, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||: 4%|3 | 4/111 [00:02<01:05, 1.63it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9466, LAS: 0.8903, UEM: 0.5488, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4419, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7649, loss: 
0.7337, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||: 6%|6 | 7/111 [00:04<01:10, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9452, LAS: 0.8893, UEM: 0.5505, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.7389, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||: 9%|9 | 10/111 [00:07<01:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9440, LAS: 0.8878, UEM: 0.5283, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8270, partial_loss/deprel_loss: 0.9081, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0434, loss: 0.7611, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||: 12%|#1 | 13/111 [00:09<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9360, LAS: 0.8785, UEM: 0.4933, LEM: 0.2363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.8289, batch_reg_loss: 0.1516, reg_loss: 0.1515 ||: 15%|#5 | 17/111 [00:11<01:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9351, LAS: 0.8776, UEM: 0.4647, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5660, partial_loss/deprel_loss: 0.6389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7760, loss: 0.8371, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||: 19%|#8 | 21/111 [00:13<00:57, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9373, LAS: 0.8812, UEM: 0.4902, 
LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5451, loss: 0.8146, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||: 22%|##1 | 24/111 [00:16<00:57, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9377, LAS: 0.8817, UEM: 0.5209, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.8096, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||: 24%|##4 | 27/111 [00:18<00:55, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.9377, LAS: 0.8823, UEM: 0.5501, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4170, partial_loss/deprel_loss: 1.0259, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2560, loss: 0.8059, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||: 28%|##7 | 31/111 [00:20<00:52, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9379, LAS: 0.8831, UEM: 0.5481, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3535, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5592, loss: 0.8039, batch_reg_loss: 0.1519, reg_loss: 0.1516 ||: 31%|### | 34/111 [00:22<00:51, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9348, LAS: 0.8797, UEM: 0.5299, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1099, partial_loss/deprel_loss: 1.1716, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3112, loss: 0.8368, batch_reg_loss: 0.1519, reg_loss: 
0.1516 ||: 33%|###3 | 37/111 [00:24<00:49, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9310, LAS: 0.8754, UEM: 0.5079, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8518, partial_loss/deprel_loss: 0.8380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.8694, batch_reg_loss: 0.1520, reg_loss: 0.1517 ||: 37%|###6 | 41/111 [00:27<00:46, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8168, UAS: 0.9289, LAS: 0.8730, UEM: 0.4885, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4595, partial_loss/deprel_loss: 1.1418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3574, loss: 0.8871, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||: 41%|#### | 45/111 [00:29<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9281, LAS: 0.8723, UEM: 0.4868, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7761, loss: 0.8943, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||: 44%|####4 | 49/111 [00:32<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9272, LAS: 0.8714, UEM: 0.4838, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.9020, batch_reg_loss: 0.1522, reg_loss: 0.1518 ||: 47%|####6 | 52/111 [00:34<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9289, LAS: 0.8733, UEM: 0.5055, LEM: 0.2813, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2791, partial_loss/deprel_loss: 0.4182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5426, loss: 0.8857, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||: 50%|####9 | 55/111 [00:37<00:39, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9281, LAS: 0.8722, UEM: 0.4949, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.7573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8954, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||: 52%|#####2 | 58/111 [00:39<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9273, LAS: 0.8712, UEM: 0.4849, LEM: 0.2654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5280, partial_loss/deprel_loss: 0.7407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8505, loss: 0.9024, batch_reg_loss: 0.1524, reg_loss: 0.1518 ||: 55%|#####4 | 61/111 [00:41<00:34, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9278, LAS: 0.8717, UEM: 0.4898, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3571, partial_loss/deprel_loss: 0.5670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6775, loss: 0.8988, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||: 59%|#####8 | 65/111 [00:43<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9284, LAS: 0.8724, UEM: 0.4908, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7764, partial_loss/deprel_loss: 0.8388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9789, loss: 0.8927, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||: 
61%|######1 | 68/111 [00:45<00:29, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9291, LAS: 0.8732, UEM: 0.5030, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.3870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.8876, batch_reg_loss: 0.1526, reg_loss: 0.1519 ||: 64%|######3 | 71/111 [00:48<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9283, LAS: 0.8722, UEM: 0.4949, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9420, partial_loss/deprel_loss: 0.8445, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.8945, batch_reg_loss: 0.1526, reg_loss: 0.1520 ||: 68%|######7 | 75/111 [00:50<00:24, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9281, LAS: 0.8719, UEM: 0.4908, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4672, partial_loss/deprel_loss: 0.6235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 0.8979, batch_reg_loss: 0.1527, reg_loss: 0.1520 ||: 71%|#######1 | 79/111 [00:53<00:21, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9287, LAS: 0.8727, UEM: 0.4885, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5525, partial_loss/deprel_loss: 0.6233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.8915, batch_reg_loss: 0.1528, reg_loss: 0.1520 ||: 75%|#######4 | 83/111 [00:55<00:18, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8832, UAS: 0.9288, LAS: 0.8729, UEM: 0.4905, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6938, partial_loss/deprel_loss: 0.7008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 0.8901, batch_reg_loss: 0.1528, reg_loss: 0.1521 ||: 78%|#######8 | 87/111 [00:58<00:15, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9289, LAS: 0.8732, UEM: 0.4935, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8700, partial_loss/deprel_loss: 0.8386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9978, loss: 0.8883, batch_reg_loss: 0.1529, reg_loss: 0.1521 ||: 82%|########1 | 91/111 [01:01<00:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9280, LAS: 0.8724, UEM: 0.4954, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2556, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.8933, batch_reg_loss: 0.1530, reg_loss: 0.1521 ||: 85%|########4 | 94/111 [01:03<00:11, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9289, LAS: 0.8735, UEM: 0.5164, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3088, loss: 0.8856, batch_reg_loss: 0.1530, reg_loss: 0.1522 ||: 87%|########7 | 97/111 [01:06<00:10, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9289, LAS: 0.8735, UEM: 0.5153, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3051, partial_loss/deprel_loss: 0.4620, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5837, loss: 0.8855, batch_reg_loss: 0.1531, reg_loss: 0.1522 ||: 91%|######### | 101/111 [01:08<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9299, LAS: 0.8746, UEM: 0.5268, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.3871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.8753, batch_reg_loss: 0.1532, reg_loss: 0.1522 ||: 95%|#########4| 105/111 [01:10<00:03, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9301, LAS: 0.8749, UEM: 0.5290, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2639, partial_loss/deprel_loss: 0.4698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.8739, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||: 98%|#########8| 109/111 [01:12<00:01, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9302, LAS: 0.8748, UEM: 0.5266, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7826, partial_loss/deprel_loss: 0.8032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8742, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 
23:52:48,580 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.803 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.783 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - reg_loss | 0.152 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UEM | 0.527 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - loss | 0.874 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEM | 0.301 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - EM | 0.861 | N/A\n", + "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Epoch duration: 0:01:14.095098\n", + "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Estimated training time remaining: 7:42:09\n", + 
"2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Epoch 48/399\n", + "2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:52:48,582 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:52:48,587 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9342, LAS: 0.8798, UEM: 0.4156, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4324, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.8418, batch_reg_loss: 0.1533, reg_loss: 0.1533 ||: 4%|3 | 4/111 [00:02<01:08, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9253, LAS: 0.8706, UEM: 0.3450, LEM: 0.1517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0604, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0111, loss: 0.9093, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||: 7%|7 | 8/111 [00:04<01:04, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9315, LAS: 0.8776, UEM: 0.5266, LEM: 0.3168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9183, partial_loss/deprel_loss: 0.9036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0599, loss: 0.8473, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||: 10%|9 | 11/111 [00:07<01:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9278, LAS: 0.8743, UEM: 0.5129, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9617, partial_loss/deprel_loss: 0.8241, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0050, loss: 0.8777, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||: 13%|#2 | 14/111 [00:09<01:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9300, LAS: 0.8761, UEM: 0.5064, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 0.8143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9571, loss: 0.8568, batch_reg_loss: 0.1535, reg_loss: 0.1534 ||: 16%|#6 | 18/111 [00:12<01:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9269, LAS: 0.8725, UEM: 0.4682, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0474, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0588, loss: 0.8885, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||: 20%|#9 | 22/111 [00:14<00:58, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9289, LAS: 0.8747, UEM: 0.4699, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4745, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.8740, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||: 23%|##3 | 26/111 [00:16<00:54, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9288, LAS: 0.8747, UEM: 0.4876, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.8699, batch_reg_loss: 0.1537, reg_loss: 0.1535 ||: 27%|##7 | 30/111 [00:19<00:52, 1.55it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9319, LAS: 0.8781, UEM: 0.5407, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4285, loss: 0.8452, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||: 30%|##9 | 33/111 [00:21<00:53, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9313, LAS: 0.8776, UEM: 0.5379, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.5909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7208, loss: 0.8510, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||: 33%|###3 | 37/111 [00:24<00:49, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9324, LAS: 0.8791, UEM: 0.5453, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3170, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.8379, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||: 36%|###6 | 40/111 [00:26<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9319, LAS: 0.8783, UEM: 0.5334, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5949, partial_loss/deprel_loss: 0.6138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8391, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||: 39%|###8 | 43/111 [00:28<00:47, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9336, LAS: 0.8803, UEM: 0.5564, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, 
partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.8227, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||: 41%|####1 | 46/111 [00:31<00:46, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9314, LAS: 0.8775, UEM: 0.5413, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7306, loss: 0.8463, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||: 45%|####5 | 50/111 [00:33<00:42, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9315, LAS: 0.8776, UEM: 0.5407, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4884, loss: 0.8460, batch_reg_loss: 0.1541, reg_loss: 0.1537 ||: 48%|####7 | 53/111 [00:35<00:40, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9324, LAS: 0.8785, UEM: 0.5441, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.8389, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||: 51%|#####1 | 57/111 [00:38<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9316, LAS: 0.8776, UEM: 0.5364, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6206, partial_loss/deprel_loss: 0.7314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.8457, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||: 54%|#####4 | 60/111 [00:40<00:35, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 
0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9304, LAS: 0.8762, UEM: 0.5293, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1126, partial_loss/deprel_loss: 1.3161, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6297, loss: 0.8591, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9300, LAS: 0.8758, UEM: 0.5307, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2438, partial_loss/deprel_loss: 0.3579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.8597, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||: 60%|###### | 67/111 [00:45<00:30, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9313, LAS: 0.8773, UEM: 0.5548, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0642, partial_loss/deprel_loss: 0.1699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3031, loss: 0.8491, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||: 63%|######3 | 70/111 [00:47<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9314, LAS: 0.8771, UEM: 0.5535, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1907, partial_loss/deprel_loss: 1.0234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2113, loss: 0.8511, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||: 66%|######5 | 73/111 [00:50<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9308, LAS: 0.8763, UEM: 0.5414, LEM: 0.3172, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5767, partial_loss/deprel_loss: 0.7398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.8574, batch_reg_loss: 0.1545, reg_loss: 0.1539 ||: 69%|######9 | 77/111 [00:52<00:24, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9307, LAS: 0.8762, UEM: 0.5364, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4993, partial_loss/deprel_loss: 0.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7621, loss: 0.8571, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||: 73%|#######2 | 81/111 [00:54<00:20, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9312, LAS: 0.8766, UEM: 0.5370, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.6207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7389, loss: 0.8523, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||: 76%|#######5 | 84/111 [00:57<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9312, LAS: 0.8766, UEM: 0.5312, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7141, partial_loss/deprel_loss: 0.6809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8422, loss: 0.8526, batch_reg_loss: 0.1547, reg_loss: 0.1539 ||: 78%|#######8 | 87/111 [00:59<00:16, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9298, LAS: 0.8751, UEM: 0.5309, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1345, partial_loss/deprel_loss: 0.9797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1654, loss: 0.8649, batch_reg_loss: 0.1547, reg_loss: 0.1540 ||: 
81%|########1 | 90/111 [01:01<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9301, LAS: 0.8755, UEM: 0.5403, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.6702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.8621, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||: 84%|########3 | 93/111 [01:03<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8038, UAS: 0.9290, LAS: 0.8744, UEM: 0.5343, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9209, partial_loss/deprel_loss: 1.1134, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4297, loss: 0.8719, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||: 86%|########6 | 96/111 [01:05<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9294, LAS: 0.8747, UEM: 0.5321, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3043, partial_loss/deprel_loss: 0.5841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.8683, batch_reg_loss: 0.1549, reg_loss: 0.1541 ||: 90%|######### | 100/111 [01:08<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9285, LAS: 0.8737, UEM: 0.5242, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1519, partial_loss/deprel_loss: 0.9448, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1412, loss: 0.8762, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||: 94%|#########3| 104/111 [01:10<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8734, UEM: 0.5209, LEM: 0.2983, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.4996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 0.8786, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||: 97%|#########7| 108/111 [01:13<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9289, LAS: 0.8740, UEM: 0.5235, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6249, loss: 0.8731, batch_reg_loss: 0.1551, reg_loss: 0.1542 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.499 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.354 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - reg_loss | 0.154 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - 
combo.training.tensorboard_writer - UEM | 0.523 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LAS | 0.874 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - loss | 0.873 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LEM | 0.298 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EM | 0.896 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Epoch duration: 0:01:15.561956\n", + "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Estimated training time remaining: 7:40:27\n", + "2023-04-06 23:54:04,143 - INFO - allennlp.training.trainer - Epoch 49/399\n", + "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:54:04,149 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8954, LAS: 0.8373, UEM: 0.3531, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9718, partial_loss/deprel_loss: 1.1487, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.4685, loss: 1.1159, batch_reg_loss: 0.1552, reg_loss: 0.1552 ||: 4%|3 | 4/111 [00:02<01:10, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9175, LAS: 0.8616, UEM: 0.4567, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3460, partial_loss/deprel_loss: 0.4872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.9446, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||: 7%|7 | 8/111 [00:05<01:06, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9264, LAS: 0.8697, UEM: 0.5122, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8896, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||: 10%|9 | 11/111 [00:07<01:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8149, UAS: 0.9191, LAS: 0.8626, UEM: 0.4610, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7589, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3545, loss: 0.9608, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||: 14%|#3 | 15/111 [00:09<01:02, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9214, LAS: 0.8657, UEM: 0.4965, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1912, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4782, loss: 0.9304, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||: 17%|#7 | 19/111 [00:12<00:58, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8960, UAS: 0.9223, LAS: 0.8664, UEM: 0.4895, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3587, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.9235, batch_reg_loss: 0.1555, reg_loss: 0.1553 ||: 21%|## | 23/111 [00:14<00:57, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9252, LAS: 0.8696, UEM: 0.4974, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.8980, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||: 24%|##4 | 27/111 [00:17<00:54, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9248, LAS: 0.8688, UEM: 0.4822, LEM: 0.2448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9313, partial_loss/deprel_loss: 0.9207, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0785, loss: 0.9065, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||: 27%|##7 | 30/111 [00:19<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9285, LAS: 0.8729, UEM: 0.5310, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.8737, batch_reg_loss: 0.1557, reg_loss: 0.1554 ||: 30%|##9 | 33/111 [00:22<00:55, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8746, UEM: 0.5256, LEM: 0.2821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6425, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.7866, loss: 0.8591, batch_reg_loss: 0.1558, reg_loss: 0.1554 ||: 33%|###3 | 37/111 [00:24<00:50, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9294, LAS: 0.8742, UEM: 0.5161, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.8647, batch_reg_loss: 0.1558, reg_loss: 0.1555 ||: 37%|###6 | 41/111 [00:26<00:44, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9300, LAS: 0.8749, UEM: 0.5093, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6331, partial_loss/deprel_loss: 0.7067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.8596, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||: 41%|#### | 45/111 [00:29<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9313, LAS: 0.8765, UEM: 0.5172, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2331, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5656, loss: 0.8482, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||: 44%|####4 | 49/111 [00:31<00:39, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9308, LAS: 0.8760, UEM: 0.5255, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.5428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6545, loss: 0.8538, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||: 48%|####7 | 53/111 [00:34<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 
0.9295, LAS: 0.8748, UEM: 0.5237, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.6295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.8677, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||: 50%|##### | 56/111 [00:37<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9301, LAS: 0.8753, UEM: 0.5200, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8050, loss: 0.8635, batch_reg_loss: 0.1561, reg_loss: 0.1556 ||: 53%|#####3 | 59/111 [00:39<00:36, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9304, LAS: 0.8758, UEM: 0.5333, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1874, partial_loss/deprel_loss: 0.3743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.8582, batch_reg_loss: 0.1561, reg_loss: 0.1557 ||: 56%|#####5 | 62/111 [00:41<00:35, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9301, LAS: 0.8755, UEM: 0.5277, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3650, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6708, loss: 0.8625, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||: 59%|#####8 | 65/111 [00:43<00:32, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9311, LAS: 0.8764, UEM: 0.5335, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5554, partial_loss/deprel_loss: 0.6621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7970, loss: 
0.8548, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||: 61%|######1 | 68/111 [00:46<00:32, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9304, LAS: 0.8755, UEM: 0.5226, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8234, partial_loss/deprel_loss: 0.7134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8917, loss: 0.8620, batch_reg_loss: 0.1563, reg_loss: 0.1557 ||: 65%|######4 | 72/111 [00:48<00:28, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9302, LAS: 0.8751, UEM: 0.5187, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4144, partial_loss/deprel_loss: 1.0153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2515, loss: 0.8652, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||: 68%|######8 | 76/111 [00:51<00:24, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9312, LAS: 0.8763, UEM: 0.5408, LEM: 0.2998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4109, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6977, loss: 0.8563, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||: 71%|#######1 | 79/111 [00:54<00:24, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9311, LAS: 0.8763, UEM: 0.5334, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 0.8572, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8287, UAS: 0.9302, LAS: 0.8752, UEM: 0.5287, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3085, partial_loss/deprel_loss: 1.0597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8685, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||: 78%|#######8 | 87/111 [00:58<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9299, LAS: 0.8749, UEM: 0.5339, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4365, loss: 0.8724, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||: 81%|########1 | 90/111 [01:01<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9307, LAS: 0.8758, UEM: 0.5454, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7527, partial_loss/deprel_loss: 0.7827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9333, loss: 0.8654, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||: 84%|########3 | 93/111 [01:03<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9312, LAS: 0.8764, UEM: 0.5440, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8018, partial_loss/deprel_loss: 0.8328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9833, loss: 0.8617, batch_reg_loss: 0.1567, reg_loss: 0.1559 ||: 87%|########7 | 97/111 [01:05<00:09, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9300, LAS: 0.8753, UEM: 0.5369, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5177, 
partial_loss/deprel_loss: 0.6388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.8700, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||: 91%|######### | 101/111 [01:07<00:06, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9295, LAS: 0.8746, UEM: 0.5288, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8003, partial_loss/deprel_loss: 0.8681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0114, loss: 0.8759, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||: 95%|#########4| 105/111 [01:10<00:03, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9292, LAS: 0.8742, UEM: 0.5270, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8836, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9858, loss: 0.8781, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||: 98%|#########8| 109/111 [01:12<00:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9294, LAS: 0.8745, UEM: 0.5276, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2578, partial_loss/deprel_loss: 0.4366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5578, loss: 0.8755, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - 
combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.437 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.258 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - reg_loss | 0.156 | N/A\n", + "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UEM | 0.528 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LAS | 0.874 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - loss | 0.876 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEM | 0.297 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - UAS | 0.929 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EM | 0.914 | N/A\n", + "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:55:18,547 - INFO - combo.training.trainer - Epoch duration: 0:01:14.403031\n", + "2023-04-06 23:55:18,547 - 
INFO - combo.training.trainer - Estimated training time remaining: 7:38:38\n", + "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Epoch 50/399\n", + "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:55:18,553 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9290, LAS: 0.8760, UEM: 0.5054, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 0.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8502, batch_reg_loss: 0.1570, reg_loss: 0.1570 ||: 3%|2 | 3/111 [00:02<01:19, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9221, LAS: 0.8702, UEM: 0.4812, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.8912, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||: 6%|6 | 7/111 [00:04<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9285, LAS: 0.8777, UEM: 0.5969, LEM: 0.3922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5646, loss: 0.8423, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||: 9%|9 | 10/111 [00:07<01:17, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9283, LAS: 0.8774, UEM: 0.5628, LEM: 
0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8468, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||: 12%|#1 | 13/111 [00:09<01:12, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8716, UAS: 0.9320, LAS: 0.8807, UEM: 0.5504, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7563, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8744, loss: 0.8170, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||: 15%|#5 | 17/111 [00:12<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9309, LAS: 0.8794, UEM: 0.5287, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7209, partial_loss/deprel_loss: 0.7438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8965, loss: 0.8283, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||: 18%|#8 | 20/111 [00:14<01:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.9249, LAS: 0.8730, UEM: 0.4993, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9332, partial_loss/deprel_loss: 1.1208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4406, loss: 0.8825, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||: 21%|## | 23/111 [00:16<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9282, LAS: 0.8763, UEM: 0.5111, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5482, loss: 0.8626, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||: 
24%|##4 | 27/111 [00:18<00:56, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9296, LAS: 0.8774, UEM: 0.5096, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7129, partial_loss/deprel_loss: 0.7503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9003, loss: 0.8551, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||: 27%|##7 | 30/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9288, LAS: 0.8761, UEM: 0.5080, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2659, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5213, loss: 0.8652, batch_reg_loss: 0.1575, reg_loss: 0.1572 ||: 31%|### | 34/111 [00:23<00:52, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9288, LAS: 0.8758, UEM: 0.5034, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5541, partial_loss/deprel_loss: 0.7148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8402, loss: 0.8701, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||: 33%|###3 | 37/111 [00:25<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9306, LAS: 0.8774, UEM: 0.5220, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1300, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.8589, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||: 36%|###6 | 40/111 [00:27<00:49, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9289, LAS: 0.8753, UEM: 0.5036, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1688, partial_loss/deprel_loss: 0.8952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1076, loss: 0.8755, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||: 40%|###9 | 44/111 [00:30<00:45, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9303, LAS: 0.8768, UEM: 0.5211, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.6167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.8604, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||: 42%|####2 | 47/111 [00:32<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9302, LAS: 0.8764, UEM: 0.5122, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8860, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.8628, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||: 45%|####5 | 50/111 [00:34<00:41, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7913, UAS: 0.9295, LAS: 0.8755, UEM: 0.5144, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9336, partial_loss/deprel_loss: 1.3001, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5847, loss: 0.8703, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||: 48%|####7 | 53/111 [00:37<00:42, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9300, LAS: 0.8766, UEM: 0.5481, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5420, partial_loss/deprel_loss: 1.0670, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3199, loss: 0.8646, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||: 50%|##### | 56/111 
[00:39<00:40, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9297, LAS: 0.8761, UEM: 0.5495, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8045, partial_loss/deprel_loss: 1.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5423, loss: 0.8670, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||: 54%|#####4 | 60/111 [00:42<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9289, LAS: 0.8751, UEM: 0.5481, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.5128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6284, loss: 0.8746, batch_reg_loss: 0.1580, reg_loss: 0.1575 ||: 57%|#####6 | 63/111 [00:44<00:34, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9290, LAS: 0.8750, UEM: 0.5390, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.5525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8767, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||: 60%|###### | 67/111 [00:46<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9295, LAS: 0.8755, UEM: 0.5369, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3454, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.8744, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||: 64%|######3 | 71/111 [00:49<00:26, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9296, LAS: 
0.8755, UEM: 0.5377, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0116, partial_loss/deprel_loss: 1.0316, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1858, loss: 0.8755, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||: 67%|######6 | 74/111 [00:51<00:25, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9294, LAS: 0.8754, UEM: 0.5309, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8416, partial_loss/deprel_loss: 0.7885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9573, loss: 0.8776, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||: 70%|####### | 78/111 [00:53<00:21, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9293, LAS: 0.8752, UEM: 0.5232, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9259, partial_loss/deprel_loss: 0.9234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.8784, batch_reg_loss: 0.1583, reg_loss: 0.1576 ||: 74%|#######3 | 82/111 [00:55<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9294, LAS: 0.8752, UEM: 0.5207, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.4930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6093, loss: 0.8777, batch_reg_loss: 0.1583, reg_loss: 0.1577 ||: 77%|#######7 | 86/111 [00:58<00:15, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8559, UAS: 0.9291, LAS: 0.8750, UEM: 0.5146, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1339, partial_loss/deprel_loss: 0.9053, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1094, loss: 
0.8806, batch_reg_loss: 0.1584, reg_loss: 0.1577 ||: 81%|########1 | 90/111 [01:01<00:13, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9299, LAS: 0.8757, UEM: 0.5307, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.8738, batch_reg_loss: 0.1585, reg_loss: 0.1577 ||: 85%|########4 | 94/111 [01:04<00:11, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9301, LAS: 0.8760, UEM: 0.5314, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.8717, batch_reg_loss: 0.1585, reg_loss: 0.1578 ||: 87%|########7 | 97/111 [01:06<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9302, LAS: 0.8758, UEM: 0.5269, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5324, partial_loss/deprel_loss: 0.6760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.8718, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||: 91%|######### | 101/111 [01:08<00:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9307, LAS: 0.8763, UEM: 0.5341, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2046, partial_loss/deprel_loss: 0.4037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5225, loss: 0.8681, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||: 95%|#########4| 105/111 [01:11<00:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, 
UAS: 0.9308, LAS: 0.8765, UEM: 0.5314, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5598, partial_loss/deprel_loss: 0.6800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.8667, batch_reg_loss: 0.1587, reg_loss: 0.1578 ||: 97%|#########7| 108/111 [01:13<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-06 23:56:34,705 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9351, LAS: 0.8773, UEM: 0.4018, LEM: 0.1232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6037, partial_loss/deprel_loss: 24.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 19.8878, loss: 28.6320, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9493, LAS: 0.8951, UEM: 0.6527, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 26.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 21.3933, loss: 25.2934, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:07, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9439, LAS: 0.8897, UEM: 0.5984, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 49.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 39.9738, loss: 26.4770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.9402, LAS: 0.8860, UEM: 0.5746, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6577, partial_loss/deprel_loss: 58.9864, partial_loss/cycle_loss: 0.0000, batch_loss: 47.5206, loss: 27.0998, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:09<00:01, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9427, LAS: 0.8904, UEM: 0.6365, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 35.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 28.2055, loss: 26.3856, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00, 1.10it/s]\n", + "2023-04-06 23:56:46,535 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 
- INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.436 | 35.093\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.288 | 0.655\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - reg_loss | 0.158 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UEM | 0.532 | 0.636\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LAS | 0.876 | 0.890\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - loss | 0.872 | 26.386\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEM | 0.305 | 0.375\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | 0.943\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - EM | 0.911 | 0.885\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Epoch duration: 
0:01:27.990431\n", + "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Estimated training time remaining: 7:38:24\n", + "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Epoch 51/399\n", + "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:56:46,538 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:56:46,543 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9240, LAS: 0.8692, UEM: 0.6476, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.4776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9016, batch_reg_loss: 0.1588, reg_loss: 0.1587 ||: 3%|2 | 3/111 [00:02<01:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9277, LAS: 0.8749, UEM: 0.6799, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.5734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.8611, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 5%|5 | 6/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9217, LAS: 0.8687, UEM: 0.6278, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3600, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9148, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||: 9%|9 | 10/111 [00:06<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, 
UAS: 0.9316, LAS: 0.8807, UEM: 0.6713, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1199, partial_loss/deprel_loss: 0.2607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.8255, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||: 13%|#2 | 14/111 [00:09<01:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9349, LAS: 0.8836, UEM: 0.6458, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6169, partial_loss/deprel_loss: 0.6818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8278, loss: 0.8022, batch_reg_loss: 0.1590, reg_loss: 0.1589 ||: 16%|#6 | 18/111 [00:11<01:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9336, LAS: 0.8810, UEM: 0.6118, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.8718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 0.8227, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||: 20%|#9 | 22/111 [00:14<00:58, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9371, LAS: 0.8849, UEM: 0.6244, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4766, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7951, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||: 23%|##3 | 26/111 [00:17<00:55, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9349, LAS: 0.8821, UEM: 0.5989, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2324, partial_loss/deprel_loss: 1.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2964, loss: 0.8195, 
batch_reg_loss: 0.1592, reg_loss: 0.1590 ||: 26%|##6 | 29/111 [00:19<00:55, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9340, LAS: 0.8813, UEM: 0.5833, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5935, loss: 0.8260, batch_reg_loss: 0.1592, reg_loss: 0.1590 ||: 30%|##9 | 33/111 [00:21<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9356, LAS: 0.8825, UEM: 0.5790, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3626, partial_loss/deprel_loss: 0.5307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.8157, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||: 33%|###3 | 37/111 [00:24<00:48, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9346, LAS: 0.8810, UEM: 0.5659, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5879, partial_loss/deprel_loss: 0.6852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8250, loss: 0.8271, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||: 37%|###6 | 41/111 [00:26<00:44, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9339, LAS: 0.8803, UEM: 0.5605, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8325, batch_reg_loss: 0.1594, reg_loss: 0.1591 ||: 41%|#### | 45/111 [00:29<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9337, LAS: 0.8795, UEM: 
0.5521, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7545, loss: 0.8381, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||: 44%|####4 | 49/111 [00:32<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9334, LAS: 0.8794, UEM: 0.5531, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6150, loss: 0.8376, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||: 47%|####6 | 52/111 [00:34<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9332, LAS: 0.8791, UEM: 0.5510, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1740, partial_loss/deprel_loss: 1.0353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2226, loss: 0.8416, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||: 50%|####9 | 55/111 [00:36<00:38, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9325, LAS: 0.8786, UEM: 0.5527, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8446, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||: 53%|#####3 | 59/111 [00:39<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9332, LAS: 0.8796, UEM: 0.5727, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9880, partial_loss/deprel_loss: 0.8851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0654, loss: 0.8385, batch_reg_loss: 
0.1597, reg_loss: 0.1592 ||: 56%|#####5 | 62/111 [00:41<00:36, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9340, LAS: 0.8803, UEM: 0.5741, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6115, partial_loss/deprel_loss: 0.6343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8323, batch_reg_loss: 0.1598, reg_loss: 0.1592 ||: 59%|#####8 | 65/111 [00:43<00:33, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9338, LAS: 0.8803, UEM: 0.5767, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1369, partial_loss/deprel_loss: 0.9492, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8330, batch_reg_loss: 0.1598, reg_loss: 0.1593 ||: 62%|######2 | 69/111 [00:46<00:28, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9338, LAS: 0.8799, UEM: 0.5702, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4896, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7990, loss: 0.8342, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||: 66%|######5 | 73/111 [00:48<00:25, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9336, LAS: 0.8800, UEM: 0.5638, LEM: 0.3331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5143, partial_loss/deprel_loss: 0.6041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.8336, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||: 69%|######9 | 77/111 [00:51<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9337, LAS: 0.8802, UEM: 0.5669, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.8323, batch_reg_loss: 0.1600, reg_loss: 0.1594 ||: 73%|#######2 | 81/111 [00:53<00:19, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9341, LAS: 0.8807, UEM: 0.5677, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3866, partial_loss/deprel_loss: 0.5101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.8288, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||: 77%|#######6 | 85/111 [00:56<00:17, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9332, LAS: 0.8796, UEM: 0.5588, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8323, loss: 0.8376, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||: 80%|######## | 89/111 [00:58<00:13, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9322, LAS: 0.8785, UEM: 0.5490, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9825, partial_loss/deprel_loss: 0.9410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1095, loss: 0.8454, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||: 84%|########3 | 93/111 [01:01<00:11, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9322, LAS: 0.8783, UEM: 0.5471, LEM: 0.3206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3857, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.8462, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||: 87%|########7 | 97/111 [01:03<00:08, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9324, LAS: 0.8783, UEM: 0.5435, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6677, partial_loss/deprel_loss: 0.8023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8459, batch_reg_loss: 0.1603, reg_loss: 0.1595 ||: 91%|######### | 101/111 [01:06<00:06, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8043, UAS: 0.9309, LAS: 0.8766, UEM: 0.5376, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7838, partial_loss/deprel_loss: 1.3054, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5615, loss: 0.8610, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||: 95%|#########4| 105/111 [01:09<00:03, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9305, LAS: 0.8760, UEM: 0.5314, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2171, partial_loss/deprel_loss: 1.0465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2410, loss: 0.8685, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||: 98%|#########8| 109/111 [01:11<00:01, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8590, UAS: 0.9298, LAS: 0.8752, UEM: 0.5275, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0356, partial_loss/deprel_loss: 0.8129, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8747, batch_reg_loss: 0.1605, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-06 23:57:59,081 - INFO - 
combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.813 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.036 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UEM | 0.528 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - loss | 0.875 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEM | 0.303 | N/A\n", + "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - 
combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EM | 0.859 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Epoch duration: 0:01:12.545910\n", + "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Estimated training time remaining: 7:36:23\n", + "2023-04-06 23:57:59,083 - INFO - allennlp.training.trainer - Epoch 52/399\n", + "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:57:59,089 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9408, LAS: 0.8872, UEM: 0.4940, LEM: 0.2390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.7606, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 3%|2 | 3/111 [00:02<01:12, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9258, LAS: 0.8711, UEM: 0.3767, LEM: 0.1598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6446, partial_loss/deprel_loss: 0.7826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9156, loss: 0.9016, batch_reg_loss: 0.1606, reg_loss: 0.1605 ||: 6%|6 | 7/111 [00:04<01:08, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9247, LAS: 0.8681, UEM: 0.3929, LEM: 0.1730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.9226, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||: 10%|9 | 11/111 [00:06<01:04, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9313, LAS: 0.8752, UEM: 0.4850, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9508, partial_loss/deprel_loss: 0.9080, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0773, loss: 0.8719, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||: 14%|#3 | 15/111 [00:09<01:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9278, LAS: 0.8711, UEM: 0.4450, LEM: 0.2155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4530, partial_loss/deprel_loss: 1.1169, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3450, loss: 0.9087, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||: 17%|#7 | 19/111 [00:11<00:55, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9296, LAS: 0.8736, UEM: 0.4856, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6275, loss: 0.8893, batch_reg_loss: 0.1609, reg_loss: 0.1607 ||: 21%|## | 23/111 [00:13<00:53, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9339, LAS: 0.8787, UEM: 0.5379, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.4749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8470, batch_reg_loss: 0.1610, reg_loss: 0.1607 ||: 24%|##4 | 27/111 [00:16<00:49, 1.69it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8564, UAS: 0.9342, LAS: 0.8793, UEM: 0.5529, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7539, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9725, loss: 0.8433, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||: 28%|##7 | 31/111 [00:18<00:48, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9329, LAS: 0.8781, UEM: 0.5454, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6378, loss: 0.8515, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||: 32%|###1 | 35/111 [00:21<00:46, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9309, LAS: 0.8760, UEM: 0.5404, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7887, partial_loss/deprel_loss: 0.8330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9853, loss: 0.8660, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||: 35%|###5 | 39/111 [00:23<00:43, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8754, UEM: 0.5276, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9182, partial_loss/deprel_loss: 0.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8703, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||: 39%|###8 | 43/111 [00:26<00:43, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9305, LAS: 0.8753, UEM: 0.5139, LEM: 0.2856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4979, partial_loss/deprel_loss: 0.6616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.8702, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||: 42%|####2 | 47/111 [00:29<00:41, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9313, LAS: 0.8764, UEM: 0.5228, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6453, loss: 0.8633, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||: 46%|####5 | 51/111 [00:32<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9325, LAS: 0.8777, UEM: 0.5325, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6361, loss: 0.8511, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||: 49%|####8 | 54/111 [00:34<00:42, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9318, LAS: 0.8771, UEM: 0.5251, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0108, partial_loss/deprel_loss: 0.8002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0038, loss: 0.8569, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||: 51%|#####1 | 57/111 [00:37<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9325, LAS: 0.8778, UEM: 0.5387, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9103, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0841, loss: 0.8512, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||: 54%|#####4 | 60/111 [00:39<00:36, 1.39it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9320, LAS: 0.8774, UEM: 0.5422, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4026, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7204, loss: 0.8555, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||: 57%|#####6 | 63/111 [00:41<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7904, UAS: 0.9314, LAS: 0.8768, UEM: 0.5508, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7467, partial_loss/deprel_loss: 1.1340, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4181, loss: 0.8571, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||: 59%|#####9 | 66/111 [00:43<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9300, LAS: 0.8752, UEM: 0.5399, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6887, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8997, loss: 0.8692, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||: 63%|######3 | 70/111 [00:45<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7555, UAS: 0.9286, LAS: 0.8739, UEM: 0.5343, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7179, partial_loss/deprel_loss: 1.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8845, loss: 0.8808, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||: 66%|######5 | 73/111 [00:47<00:26, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9288, LAS: 0.8740, UEM: 0.5333, LEM: 
0.2995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5149, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8786, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||: 69%|######9 | 77/111 [00:50<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9295, LAS: 0.8748, UEM: 0.5507, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9174, partial_loss/deprel_loss: 0.9188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0803, loss: 0.8734, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||: 72%|#######2 | 80/111 [00:52<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9300, LAS: 0.8753, UEM: 0.5510, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8682, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||: 75%|#######4 | 83/111 [00:54<00:19, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9305, LAS: 0.8758, UEM: 0.5480, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0668, loss: 0.8654, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||: 78%|#######8 | 87/111 [00:57<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9295, LAS: 0.8745, UEM: 0.5390, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1307, partial_loss/deprel_loss: 0.9379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1385, loss: 0.8737, batch_reg_loss: 0.1620, 
reg_loss: 0.1613 ||: 82%|########1 | 91/111 [00:59<00:12, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9304, LAS: 0.8754, UEM: 0.5423, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5534, partial_loss/deprel_loss: 0.6744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8675, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||: 86%|########5 | 95/111 [01:01<00:10, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9307, LAS: 0.8758, UEM: 0.5385, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7639, loss: 0.8670, batch_reg_loss: 0.1621, reg_loss: 0.1613 ||: 89%|########9 | 99/111 [01:04<00:07, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9301, LAS: 0.8751, UEM: 0.5371, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8170, partial_loss/deprel_loss: 0.7834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8710, batch_reg_loss: 0.1622, reg_loss: 0.1613 ||: 93%|#########2| 103/111 [01:07<00:05, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9301, LAS: 0.8751, UEM: 0.5326, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2890, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2153, loss: 0.8726, batch_reg_loss: 0.1622, reg_loss: 0.1614 ||: 96%|#########6| 107/111 [01:09<00:02, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 
0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.577 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.412 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - reg_loss | 0.161 | N/A\n", + "2023-04-06 
23:59:11,775 - INFO - combo.training.tensorboard_writer - UEM | 0.531 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - loss | 0.871 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEM | 0.299 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EM | 0.903 | N/A\n", + "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Epoch duration: 0:01:12.692473\n", + "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Estimated training time remaining: 7:34:25\n", + "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Epoch 53/399\n", + "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-06 23:59:11,782 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9467, LAS: 0.8928, UEM: 0.5404, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5696, partial_loss/deprel_loss: 0.5960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 
0.7637, batch_reg_loss: 0.1623, reg_loss: 0.1623 ||: 3%|2 | 3/111 [00:02<01:12, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9464, LAS: 0.8947, UEM: 0.5560, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5968, partial_loss/deprel_loss: 0.5837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.7131, batch_reg_loss: 0.1624, reg_loss: 0.1623 ||: 6%|6 | 7/111 [00:04<01:08, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9365, LAS: 0.8817, UEM: 0.4906, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8449, partial_loss/deprel_loss: 0.7423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9252, loss: 0.8082, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||: 10%|9 | 11/111 [00:07<01:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9394, LAS: 0.8855, UEM: 0.5849, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.7742, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||: 13%|#2 | 14/111 [00:09<01:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9397, LAS: 0.8861, UEM: 0.5769, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3935, partial_loss/deprel_loss: 0.5610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6901, loss: 0.7727, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||: 15%|#5 | 17/111 [00:11<01:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9409, LAS: 0.8868, UEM: 0.5687, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5827, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.7743, batch_reg_loss: 0.1626, reg_loss: 0.1624 ||: 19%|#8 | 21/111 [00:13<00:57, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8515, UAS: 0.9382, LAS: 0.8830, UEM: 0.5330, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7980, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9719, loss: 0.8025, batch_reg_loss: 0.1626, reg_loss: 0.1625 ||: 23%|##2 | 25/111 [00:16<00:54, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9323, LAS: 0.8767, UEM: 0.5110, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0175, partial_loss/deprel_loss: 0.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8586, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||: 25%|##5 | 28/111 [00:18<00:54, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9278, LAS: 0.8720, UEM: 0.4900, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1837, partial_loss/deprel_loss: 0.8709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0962, loss: 0.8946, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||: 28%|##7 | 31/111 [00:20<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9276, LAS: 0.8718, UEM: 0.4794, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4971, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6420, loss: 0.8936, batch_reg_loss: 0.1628, reg_loss: 0.1625 ||: 31%|### | 34/111 [00:22<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9292, LAS: 0.8736, UEM: 0.4858, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8827, batch_reg_loss: 0.1628, reg_loss: 0.1626 ||: 34%|###4 | 38/111 [00:25<00:48, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9295, LAS: 0.8742, UEM: 0.4897, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.6584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7828, loss: 0.8813, batch_reg_loss: 0.1629, reg_loss: 0.1626 ||: 38%|###7 | 42/111 [00:27<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9311, LAS: 0.8761, UEM: 0.5027, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.8652, batch_reg_loss: 0.1630, reg_loss: 0.1626 ||: 41%|####1 | 46/111 [00:30<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9320, LAS: 0.8773, UEM: 0.5124, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5651, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.8546, batch_reg_loss: 0.1630, reg_loss: 0.1627 ||: 45%|####5 | 50/111 [00:33<00:41, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, 
UAS: 0.9308, LAS: 0.8758, UEM: 0.5093, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1829, partial_loss/deprel_loss: 0.9669, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1732, loss: 0.8625, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||: 48%|####7 | 53/111 [00:35<00:40, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.9278, LAS: 0.8724, UEM: 0.4995, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.1906, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4580, loss: 0.8887, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||: 51%|#####1 | 57/111 [00:37<00:35, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9276, LAS: 0.8723, UEM: 0.4999, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5744, partial_loss/deprel_loss: 1.0889, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3492, loss: 0.8901, batch_reg_loss: 0.1632, reg_loss: 0.1627 ||: 55%|#####4 | 61/111 [00:39<00:31, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9285, LAS: 0.8731, UEM: 0.5093, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6473, partial_loss/deprel_loss: 0.7667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9061, loss: 0.8856, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||: 59%|#####8 | 65/111 [00:42<00:29, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9278, LAS: 0.8724, UEM: 0.5045, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4895, partial_loss/deprel_loss: 0.5364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, 
loss: 0.8913, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||: 62%|######2 | 69/111 [00:45<00:27, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8434, UAS: 0.9266, LAS: 0.8711, UEM: 0.4930, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0492, partial_loss/deprel_loss: 1.0301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1973, loss: 0.9030, batch_reg_loss: 0.1634, reg_loss: 0.1628 ||: 66%|######5 | 73/111 [00:47<00:24, 1.57it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9267, LAS: 0.8713, UEM: 0.4968, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6938, loss: 0.9019, batch_reg_loss: 0.1635, reg_loss: 0.1629 ||: 69%|######9 | 77/111 [00:50<00:22, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9279, LAS: 0.8725, UEM: 0.5080, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.5856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7172, loss: 0.8911, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||: 73%|#######2 | 81/111 [00:53<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9288, LAS: 0.8735, UEM: 0.5127, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8488, loss: 0.8845, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||: 76%|#######5 | 84/111 [00:55<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9295, LAS: 0.8742, UEM: 0.5182, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6469, partial_loss/deprel_loss: 0.6858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8417, loss: 0.8779, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||: 78%|#######8 | 87/111 [00:58<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9290, LAS: 0.8735, UEM: 0.5111, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 0.9826, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.8841, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||: 81%|########1 | 90/111 [01:00<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9303, LAS: 0.8751, UEM: 0.5402, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2008, partial_loss/deprel_loss: 0.3759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.8728, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||: 84%|########3 | 93/111 [01:02<00:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8101, UAS: 0.9297, LAS: 0.8744, UEM: 0.5358, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3972, partial_loss/deprel_loss: 1.1130, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3336, loss: 0.8781, batch_reg_loss: 0.1638, reg_loss: 0.1630 ||: 87%|########7 | 97/111 [01:04<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9295, LAS: 0.8743, UEM: 0.5347, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3269, 
partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3058, loss: 0.8800, batch_reg_loss: 0.1638, reg_loss: 0.1631 ||: 90%|######### | 100/111 [01:07<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9296, LAS: 0.8744, UEM: 0.5320, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3737, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.8794, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||: 94%|#########3| 104/111 [01:09<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9301, LAS: 0.8749, UEM: 0.5330, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9118, partial_loss/deprel_loss: 0.9566, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8764, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||: 97%|#########7| 108/111 [01:12<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + 
"2023-04-07 00:00:26,510 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.987 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.070 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - reg_loss | 0.163 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UEM | 0.533 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LAS | 0.875 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - loss | 0.877 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEM | 0.298 | N/A\n", + "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + 
"2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EM | 0.840 | N/A\n", + "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:00:26,512 - INFO - combo.training.trainer - Epoch duration: 0:01:14.736354\n", + "2023-04-07 00:00:26,513 - INFO - combo.training.trainer - Estimated training time remaining: 7:32:42\n", + "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Epoch 54/399\n", + "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:00:26,520 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9448, LAS: 0.8931, UEM: 0.7116, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2033, partial_loss/deprel_loss: 0.3485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.7435, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 3%|2 | 3/111 [00:02<01:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9409, LAS: 0.8887, UEM: 0.5927, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3385, partial_loss/deprel_loss: 0.4904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6241, loss: 0.7844, batch_reg_loss: 0.1641, reg_loss: 0.1640 ||: 6%|6 | 7/111 [00:04<01:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9355, LAS: 0.8830, UEM: 0.5229, LEM: 0.2916, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 0.8782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0361, loss: 0.8226, batch_reg_loss: 0.1641, reg_loss: 0.1641 ||: 10%|9 | 11/111 [00:06<01:05, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9305, LAS: 0.8779, UEM: 0.5623, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.3135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4483, loss: 0.8639, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||: 13%|#2 | 14/111 [00:09<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9307, LAS: 0.8791, UEM: 0.6237, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1766, partial_loss/deprel_loss: 0.9353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1478, loss: 0.8571, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||: 15%|#5 | 17/111 [00:13<01:29, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9324, LAS: 0.8798, UEM: 0.5994, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4481, partial_loss/deprel_loss: 0.6010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8410, batch_reg_loss: 0.1643, reg_loss: 0.1641 ||: 19%|#8 | 21/111 [00:16<01:18, 1.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9320, LAS: 0.8789, UEM: 0.5892, LEM: 0.3873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5723, loss: 0.8520, batch_reg_loss: 0.1643, reg_loss: 0.1642 ||: 22%|##1 | 
24/111 [00:19<01:13, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9321, LAS: 0.8784, UEM: 0.5624, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5136, partial_loss/deprel_loss: 0.6196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7628, loss: 0.8548, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||: 25%|##5 | 28/111 [00:21<01:04, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9341, LAS: 0.8809, UEM: 0.5804, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.3954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.8333, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||: 28%|##7 | 31/111 [00:23<01:02, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9328, LAS: 0.8791, UEM: 0.5736, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.8460, batch_reg_loss: 0.1645, reg_loss: 0.1642 ||: 31%|### | 34/111 [00:26<00:59, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9333, LAS: 0.8795, UEM: 0.5669, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.8440, batch_reg_loss: 0.1645, reg_loss: 0.1643 ||: 33%|###3 | 37/111 [00:28<00:55, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9334, LAS: 0.8801, UEM: 0.5717, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 0.9017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8380, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||: 36%|###6 | 40/111 [00:30<00:53, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9321, LAS: 0.8783, UEM: 0.5681, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1812, partial_loss/deprel_loss: 0.8796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1046, loss: 0.8479, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||: 39%|###8 | 43/111 [00:32<00:50, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9331, LAS: 0.8794, UEM: 0.5662, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 0.8421, batch_reg_loss: 0.1647, reg_loss: 0.1643 ||: 42%|####2 | 47/111 [00:35<00:45, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9321, LAS: 0.8786, UEM: 0.5562, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3762, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6528, loss: 0.8515, batch_reg_loss: 0.1647, reg_loss: 0.1644 ||: 46%|####5 | 51/111 [00:37<00:40, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9321, LAS: 0.8786, UEM: 0.5521, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5805, loss: 0.8509, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||: 49%|####8 | 54/111 [00:39<00:39, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9332, LAS: 0.8799, UEM: 0.5667, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4449, partial_loss/deprel_loss: 0.6679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8421, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||: 51%|#####1 | 57/111 [00:41<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7900, UAS: 0.9308, LAS: 0.8773, UEM: 0.5544, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8413, partial_loss/deprel_loss: 1.2192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5085, loss: 0.8640, batch_reg_loss: 0.1649, reg_loss: 0.1644 ||: 55%|#####4 | 61/111 [00:44<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9321, LAS: 0.8786, UEM: 0.5625, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1444, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.8516, batch_reg_loss: 0.1649, reg_loss: 0.1645 ||: 59%|#####8 | 65/111 [00:47<00:31, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9318, LAS: 0.8784, UEM: 0.5630, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4898, partial_loss/deprel_loss: 0.6133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.8540, batch_reg_loss: 0.1650, reg_loss: 0.1645 ||: 62%|######2 | 69/111 [00:49<00:28, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9320, LAS: 0.8785, UEM: 
0.5594, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.5626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8529, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||: 65%|######4 | 72/111 [00:52<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9308, LAS: 0.8771, UEM: 0.5510, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0675, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 0.8638, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||: 68%|######7 | 75/111 [00:54<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9300, LAS: 0.8759, UEM: 0.5432, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3399, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2233, loss: 0.8729, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||: 70%|####### | 78/111 [00:56<00:22, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9305, LAS: 0.8765, UEM: 0.5447, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6205, partial_loss/deprel_loss: 0.7112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8583, loss: 0.8691, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||: 73%|#######2 | 81/111 [00:58<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9294, LAS: 0.8752, UEM: 0.5381, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5750, partial_loss/deprel_loss: 0.6413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8801, 
batch_reg_loss: 0.1653, reg_loss: 0.1646 ||: 77%|#######6 | 85/111 [01:00<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9299, LAS: 0.8759, UEM: 0.5388, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7982, loss: 0.8754, batch_reg_loss: 0.1653, reg_loss: 0.1646 ||: 79%|#######9 | 88/111 [01:02<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9307, LAS: 0.8765, UEM: 0.5455, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2060, partial_loss/deprel_loss: 0.3806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.8701, batch_reg_loss: 0.1654, reg_loss: 0.1647 ||: 83%|########2 | 92/111 [01:05<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8516, UAS: 0.9298, LAS: 0.8756, UEM: 0.5412, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0076, partial_loss/deprel_loss: 0.9710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1438, loss: 0.8782, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||: 86%|########6 | 96/111 [01:08<00:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9303, LAS: 0.8761, UEM: 0.5436, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7639, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9688, loss: 0.8738, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||: 89%|########9 | 99/111 [01:10<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9296, 
LAS: 0.8754, UEM: 0.5380, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1404, loss: 0.8794, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||: 92%|#########1| 102/111 [01:12<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9302, LAS: 0.8761, UEM: 0.5385, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5787, loss: 0.8726, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||: 95%|#########5| 106/111 [01:14<00:03, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9303, LAS: 0.8761, UEM: 0.5354, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8501, partial_loss/deprel_loss: 0.8843, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0431, loss: 0.8737, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||: 99%|#########9| 110/111 [01:17<00:00, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9302, LAS: 0.8760, UEM: 0.5334, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.7209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9017, loss: 0.8739, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||: 100%|##########| 111/111 [01:17<00:00, 1.42it/s]\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - 
combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.721 | N/A\n", + "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.797 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - reg_loss | 0.165 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UEM | 0.533 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LAS | 0.876 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - loss | 0.874 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEM | 0.302 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EM | 0.865 | N/A\n", + "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 
00:01:44,506 - INFO - combo.training.trainer - Epoch duration: 0:01:17.993194\n", + "2023-04-07 00:01:44,506 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:20\n", + "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Epoch 55/399\n", + "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:01:44,507 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:01:44,513 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9378, LAS: 0.8843, UEM: 0.6189, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6997, loss: 0.7860, batch_reg_loss: 0.1657, reg_loss: 0.1657 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9324, LAS: 0.8764, UEM: 0.4882, LEM: 0.2407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0905, partial_loss/deprel_loss: 1.0808, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2485, loss: 0.8774, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 6%|6 | 7/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.9306, LAS: 0.8749, UEM: 0.4708, LEM: 0.2315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0499, loss: 0.8856, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||: 10%|9 | 11/111 [00:07<01:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9339, LAS: 0.8782, UEM: 0.5102, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5669, loss: 0.8600, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||: 14%|#3 | 15/111 [00:09<01:01, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9279, LAS: 0.8717, UEM: 0.4778, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0383, partial_loss/deprel_loss: 0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9098, batch_reg_loss: 0.1660, reg_loss: 0.1659 ||: 17%|#7 | 19/111 [00:11<00:58, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9278, LAS: 0.8715, UEM: 0.4733, LEM: 0.2227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3426, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.9059, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||: 21%|## | 23/111 [00:14<00:55, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9272, LAS: 0.8709, UEM: 0.4712, LEM: 0.2228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2936, partial_loss/deprel_loss: 0.4856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6133, loss: 0.9143, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||: 23%|##3 | 26/111 [00:16<00:55, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9271, LAS: 0.8711, UEM: 0.4586, LEM: 0.2171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7521, partial_loss/deprel_loss: 
0.7589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9237, loss: 0.9126, batch_reg_loss: 0.1662, reg_loss: 0.1659 ||: 26%|##6 | 29/111 [00:18<00:57, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9291, LAS: 0.8736, UEM: 0.4894, LEM: 0.2468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7406, loss: 0.8919, batch_reg_loss: 0.1662, reg_loss: 0.1660 ||: 29%|##8 | 32/111 [00:21<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9282, LAS: 0.8727, UEM: 0.5098, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8966, batch_reg_loss: 0.1663, reg_loss: 0.1660 ||: 32%|###2 | 36/111 [00:24<00:54, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9284, LAS: 0.8732, UEM: 0.5109, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2249, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.8943, batch_reg_loss: 0.1664, reg_loss: 0.1660 ||: 36%|###6 | 40/111 [00:26<00:50, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9290, LAS: 0.8739, UEM: 0.5005, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5359, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7525, loss: 0.8865, batch_reg_loss: 0.1664, reg_loss: 0.1661 ||: 40%|###9 | 44/111 [00:29<00:44, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9300, LAS: 0.8750, UEM: 0.5045, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0223, partial_loss/deprel_loss: 0.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1136, loss: 0.8820, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||: 43%|####3 | 48/111 [00:31<00:41, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9303, LAS: 0.8755, UEM: 0.5021, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7655, partial_loss/deprel_loss: 0.7056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.8792, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||: 47%|####6 | 52/111 [00:34<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9302, LAS: 0.8753, UEM: 0.4943, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8802, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||: 50%|####9 | 55/111 [00:36<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9292, LAS: 0.8742, UEM: 0.4979, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3299, partial_loss/deprel_loss: 0.5148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6445, loss: 0.8854, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||: 52%|#####2 | 58/111 [00:38<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9300, LAS: 0.8748, UEM: 0.4960, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5726, partial_loss/deprel_loss: 0.6414, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7943, loss: 0.8809, batch_reg_loss: 0.1667, reg_loss: 0.1662 ||: 56%|#####5 | 62/111 [00:41<00:33, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9287, LAS: 0.8734, UEM: 0.4838, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3249, partial_loss/deprel_loss: 0.9868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2212, loss: 0.8900, batch_reg_loss: 0.1668, reg_loss: 0.1662 ||: 59%|#####9 | 66/111 [00:44<00:30, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9292, LAS: 0.8740, UEM: 0.4893, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5890, loss: 0.8867, batch_reg_loss: 0.1668, reg_loss: 0.1663 ||: 62%|######2 | 69/111 [00:46<00:29, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9279, LAS: 0.8726, UEM: 0.4918, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.8979, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||: 66%|######5 | 73/111 [00:49<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9283, LAS: 0.8730, UEM: 0.4954, LEM: 0.2557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4216, partial_loss/deprel_loss: 0.5738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.8955, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||: 68%|######8 | 76/111 [00:51<00:24, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9292, LAS: 0.8739, UEM: 0.5096, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1119, partial_loss/deprel_loss: 0.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4047, loss: 0.8890, batch_reg_loss: 0.1670, reg_loss: 0.1663 ||: 71%|#######1 | 79/111 [00:53<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9288, LAS: 0.8736, UEM: 0.5289, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.1641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3149, loss: 0.8923, batch_reg_loss: 0.1670, reg_loss: 0.1664 ||: 74%|#######3 | 82/111 [00:55<00:21, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9287, LAS: 0.8735, UEM: 0.5236, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8288, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.8928, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||: 77%|#######7 | 86/111 [00:58<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9293, LAS: 0.8741, UEM: 0.5222, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2973, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.8897, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||: 81%|########1 | 90/111 [01:00<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9300, LAS: 0.8750, UEM: 0.5309, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.4656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6126, loss: 0.8813, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||: 84%|########3 | 93/111 [01:02<00:12, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9304, LAS: 0.8754, UEM: 0.5302, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.8764, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||: 86%|########6 | 96/111 [01:05<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9304, LAS: 0.8755, UEM: 0.5246, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9842, partial_loss/deprel_loss: 0.9223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1020, loss: 0.8779, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||: 90%|######### | 100/111 [01:07<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9302, LAS: 0.8752, UEM: 0.5250, LEM: 0.2941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3074, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 0.8795, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||: 93%|#########2| 103/111 [01:09<00:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9305, LAS: 0.8756, UEM: 0.5243, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3452, partial_loss/deprel_loss: 0.4917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6297, loss: 0.8772, batch_reg_loss: 0.1673, reg_loss: 0.1666 ||: 96%|#########6| 
107/111 [01:12<00:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9307, LAS: 0.8759, UEM: 0.5311, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0582, partial_loss/deprel_loss: 0.8997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8732, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||: 99%|#########9| 110/111 [01:14<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9310, LAS: 0.8761, UEM: 0.5327, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3381, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6897, loss: 0.8716, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-07 00:03:00,154 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9457, LAS: 0.8973, UEM: 0.7127, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2112, partial_loss/deprel_loss: 20.6524, partial_loss/cycle_loss: 0.0000, batch_loss: 16.5642, loss: 23.9662, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9355, LAS: 0.8835, UEM: 0.6797, LEM: 0.4542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6319, partial_loss/deprel_loss: 58.9152, partial_loss/cycle_loss: 0.0000, batch_loss: 47.4585, loss: 28.1342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:05<00:08, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9338, LAS: 0.8808, UEM: 0.6146, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 30.3347, partial_loss/cycle_loss: 0.0000, batch_loss: 24.4169, loss: 29.2772, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:07<00:06, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9387, LAS: 0.8860, UEM: 0.6328, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5421, partial_loss/deprel_loss: 24.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7214, loss: 27.9239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:09<00:02, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.05it/s]\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 
0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.568 | 34.831\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.338 | 0.708\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - reg_loss | 0.167 | 0.000\n", + "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UEM | 0.533 | 0.637\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LAS | 0.876 | 0.890\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - loss | 0.872 | 26.260\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEM | 0.300 | 0.368\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - UAS | 0.931 | 0.943\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EM | 0.901 | 0.886\n", + "2023-04-07 00:03:12,594 - INFO - 
combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Epoch duration: 0:01:28.088627\n", + "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:01\n", + "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Epoch 56/399\n", + "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:03:12,602 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9052, LAS: 0.8484, UEM: 0.3495, LEM: 0.1702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4177, partial_loss/deprel_loss: 0.5719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 1.0817, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 3%|2 | 3/111 [00:02<01:19, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9245, LAS: 0.8711, UEM: 0.3775, LEM: 0.1822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7256, partial_loss/deprel_loss: 0.7942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.9261, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||: 6%|6 | 7/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8121, UAS: 0.9251, LAS: 0.8701, UEM: 0.4158, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5426, partial_loss/deprel_loss: 1.1777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4182, loss: 0.9325, batch_reg_loss: 0.1675, reg_loss: 0.1675 
||: 10%|9 | 11/111 [00:06<01:06, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9213, LAS: 0.8668, UEM: 0.4016, LEM: 0.1869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7875, loss: 0.9613, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||: 14%|#3 | 15/111 [00:09<01:02, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9253, LAS: 0.8701, UEM: 0.4440, LEM: 0.2079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.9270, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||: 16%|#6 | 18/111 [00:11<01:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9262, LAS: 0.8708, UEM: 0.4256, LEM: 0.1955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7134, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9461, loss: 0.9189, batch_reg_loss: 0.1677, reg_loss: 0.1675 ||: 19%|#8 | 21/111 [00:13<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9281, LAS: 0.8735, UEM: 0.4891, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2322, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.8989, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||: 22%|##1 | 24/111 [00:15<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9323, LAS: 0.8779, UEM: 0.5258, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6955, partial_loss/deprel_loss: 0.6607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8355, loss: 0.8635, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||: 25%|##5 | 28/111 [00:18<00:55, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9335, LAS: 0.8788, UEM: 0.5304, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6671, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8448, loss: 0.8535, batch_reg_loss: 0.1679, reg_loss: 0.1676 ||: 29%|##8 | 32/111 [00:20<00:51, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.9307, LAS: 0.8755, UEM: 0.5065, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8566, partial_loss/deprel_loss: 0.7906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9718, loss: 0.8817, batch_reg_loss: 0.1679, reg_loss: 0.1677 ||: 32%|###2 | 36/111 [00:23<00:47, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9307, LAS: 0.8759, UEM: 0.5141, LEM: 0.2816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.8756, batch_reg_loss: 0.1680, reg_loss: 0.1677 ||: 36%|###6 | 40/111 [00:26<00:47, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9301, LAS: 0.8756, UEM: 0.5189, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9675, partial_loss/deprel_loss: 0.9376, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8777, batch_reg_loss: 0.1681, reg_loss: 0.1677 ||: 40%|###9 | 44/111 [00:28<00:43, 
1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9300, LAS: 0.8757, UEM: 0.5087, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5739, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7143, loss: 0.8775, batch_reg_loss: 0.1681, reg_loss: 0.1678 ||: 43%|####3 | 48/111 [00:31<00:40, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9298, LAS: 0.8754, UEM: 0.5231, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3955, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7318, loss: 0.8786, batch_reg_loss: 0.1682, reg_loss: 0.1678 ||: 47%|####6 | 52/111 [00:33<00:38, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9317, LAS: 0.8777, UEM: 0.5608, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.8624, batch_reg_loss: 0.1683, reg_loss: 0.1678 ||: 50%|##### | 56/111 [00:36<00:35, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9320, LAS: 0.8779, UEM: 0.5538, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7732, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9828, loss: 0.8628, batch_reg_loss: 0.1683, reg_loss: 0.1679 ||: 54%|#####4 | 60/111 [00:38<00:32, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9315, LAS: 0.8774, UEM: 0.5514, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5800, loss: 0.8651, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||: 58%|#####7 | 64/111 [00:41<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9296, LAS: 0.8752, UEM: 0.5375, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9756, loss: 0.8823, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||: 61%|######1 | 68/111 [00:44<00:28, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9303, LAS: 0.8758, UEM: 0.5345, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6570, partial_loss/deprel_loss: 0.7377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8901, loss: 0.8786, batch_reg_loss: 0.1685, reg_loss: 0.1679 ||: 65%|######4 | 72/111 [00:46<00:25, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9287, LAS: 0.8742, UEM: 0.5252, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5470, partial_loss/deprel_loss: 0.9589, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2450, loss: 0.8900, batch_reg_loss: 0.1686, reg_loss: 0.1680 ||: 68%|######8 | 76/111 [00:49<00:22, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9281, LAS: 0.8733, UEM: 0.5200, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0865, partial_loss/deprel_loss: 0.9616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1552, loss: 0.8975, batch_reg_loss: 
0.1686, reg_loss: 0.1680 ||: 72%|#######2 | 80/111 [00:51<00:19, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9276, LAS: 0.8728, UEM: 0.5178, LEM: 0.3011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2355, partial_loss/deprel_loss: 0.3739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.9017, batch_reg_loss: 0.1687, reg_loss: 0.1680 ||: 76%|#######5 | 84/111 [00:54<00:17, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9287, LAS: 0.8741, UEM: 0.5313, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9235, partial_loss/deprel_loss: 0.8001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9935, loss: 0.8910, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||: 79%|#######9 | 88/111 [00:57<00:15, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9295, LAS: 0.8749, UEM: 0.5379, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.3850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.8835, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||: 82%|########1 | 91/111 [00:59<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9292, LAS: 0.8745, UEM: 0.5322, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 1.0392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2448, loss: 0.8888, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||: 85%|########4 | 94/111 [01:01<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9293, LAS: 0.8746, 
UEM: 0.5293, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1261, partial_loss/deprel_loss: 0.9523, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1560, loss: 0.8880, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||: 87%|########7 | 97/111 [01:04<00:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9299, LAS: 0.8754, UEM: 0.5300, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.5280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6709, loss: 0.8825, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||: 91%|######### | 101/111 [01:06<00:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9300, LAS: 0.8756, UEM: 0.5286, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7124, loss: 0.8817, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||: 94%|#########3| 104/111 [01:08<00:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9309, LAS: 0.8767, UEM: 0.5328, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6869, loss: 0.8740, batch_reg_loss: 0.1691, reg_loss: 0.1682 ||: 97%|#########7| 108/111 [01:11<00:02, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 
0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.513 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.350 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - reg_loss | 0.168 | N/A\n", + "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UEM | 0.534 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LAS | 0.877 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - 
combo.training.tensorboard_writer - loss | 0.871 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEM | 0.305 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - UAS | 0.931 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EM | 0.904 | N/A\n", + "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Epoch duration: 0:01:14.079801\n", + "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Estimated training time remaining: 7:29:14\n", + "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Epoch 57/399\n", + "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:04:26,683 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9574, LAS: 0.9082, UEM: 0.6799, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.3836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.6548, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 3%|2 | 3/111 [00:02<01:22, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9448, LAS: 0.8923, UEM: 0.5579, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8817, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9765, loss: 0.7685, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||: 5%|5 | 6/111 [00:04<01:21, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9418, LAS: 0.8873, UEM: 0.5336, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.8019, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||: 8%|8 | 9/111 [00:06<01:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9361, LAS: 0.8815, UEM: 0.5493, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2932, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6116, loss: 0.8263, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||: 11%|# | 12/111 [00:08<01:13, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9336, LAS: 0.8793, UEM: 0.5382, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.6198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7686, loss: 0.8427, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||: 14%|#3 | 15/111 [00:10<01:09, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9344, LAS: 0.8807, UEM: 0.5316, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4974, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6276, loss: 0.8396, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||: 16%|#6 | 18/111 [00:13<01:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9383, LAS: 0.8858, UEM: 0.5676, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.8026, batch_reg_loss: 0.1694, reg_loss: 0.1692 ||: 20%|#9 | 22/111 [00:15<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9375, LAS: 0.8848, UEM: 0.5659, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.5643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.8037, batch_reg_loss: 0.1694, reg_loss: 0.1693 ||: 23%|##2 | 25/111 [00:17<01:01, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9375, LAS: 0.8849, UEM: 0.5632, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8074, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||: 25%|##5 | 28/111 [00:20<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9383, LAS: 0.8857, UEM: 0.5685, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5460, loss: 0.7991, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||: 28%|##7 | 31/111 [00:22<00:59, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9386, LAS: 0.8856, UEM: 0.5538, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6780, partial_loss/deprel_loss: 0.7338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.8009, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||: 32%|###1 | 35/111 [00:24<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9393, LAS: 0.8863, UEM: 0.5712, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.7953, batch_reg_loss: 0.1696, reg_loss: 0.1693 ||: 34%|###4 | 38/111 [00:27<00:50, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9381, LAS: 0.8853, UEM: 0.5535, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8753, partial_loss/deprel_loss: 0.8562, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8056, batch_reg_loss: 0.1696, reg_loss: 0.1694 ||: 38%|###7 | 42/111 [00:29<00:45, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9391, LAS: 0.8863, UEM: 0.5589, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2931, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5923, loss: 0.7981, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||: 41%|####1 | 46/111 [00:32<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9383, LAS: 0.8852, UEM: 0.5596, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2342, partial_loss/deprel_loss: 0.9472, partial_loss/cycle_loss: 
0.0000, batch_loss: 1.1743, loss: 0.8052, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||: 44%|####4 | 49/111 [00:34<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9382, LAS: 0.8851, UEM: 0.5530, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6501, loss: 0.8059, batch_reg_loss: 0.1698, reg_loss: 0.1694 ||: 47%|####6 | 52/111 [00:36<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9379, LAS: 0.8845, UEM: 0.5488, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.5204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6537, loss: 0.8090, batch_reg_loss: 0.1698, reg_loss: 0.1695 ||: 50%|##### | 56/111 [00:39<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9379, LAS: 0.8848, UEM: 0.5595, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2587, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1916, loss: 0.8063, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||: 53%|#####3 | 59/111 [00:41<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9372, LAS: 0.8841, UEM: 0.5497, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.7492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9366, loss: 0.8141, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||: 56%|#####5 | 62/111 [00:43<00:35, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9372, LAS: 0.8840, UEM: 0.5502, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.3824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5258, loss: 0.8138, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||: 59%|#####8 | 65/111 [00:46<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9362, LAS: 0.8828, UEM: 0.5413, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.7748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9505, loss: 0.8236, batch_reg_loss: 0.1700, reg_loss: 0.1695 ||: 61%|######1 | 68/111 [00:48<00:30, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9372, LAS: 0.8837, UEM: 0.5485, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2735, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.8154, batch_reg_loss: 0.1700, reg_loss: 0.1696 ||: 65%|######4 | 72/111 [00:50<00:27, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9369, LAS: 0.8832, UEM: 0.5447, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8168, partial_loss/deprel_loss: 0.7835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9603, loss: 0.8159, batch_reg_loss: 0.1701, reg_loss: 0.1696 ||: 68%|######8 | 76/111 [00:53<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9351, LAS: 0.8814, UEM: 0.5352, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.8657, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0703, loss: 0.8321, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||: 72%|#######2 | 80/111 [00:55<00:20, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9344, LAS: 0.8804, UEM: 0.5286, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3138, partial_loss/deprel_loss: 0.9856, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2214, loss: 0.8418, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||: 76%|#######5 | 84/111 [00:58<00:17, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7678, UAS: 0.9332, LAS: 0.8793, UEM: 0.5226, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4154, partial_loss/deprel_loss: 1.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8261, loss: 0.8530, batch_reg_loss: 0.1703, reg_loss: 0.1697 ||: 79%|#######9 | 88/111 [01:00<00:15, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8031, UAS: 0.9315, LAS: 0.8773, UEM: 0.5138, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6813, partial_loss/deprel_loss: 1.2116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 0.8697, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||: 83%|########2 | 92/111 [01:03<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8146, UAS: 0.9307, LAS: 0.8762, UEM: 0.5060, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5085, partial_loss/deprel_loss: 1.0874, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3421, loss: 0.8791, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||: 86%|########6 | 96/111 [01:06<00:10, 1.49it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9313, LAS: 0.8770, UEM: 0.5214, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 0.7930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9809, loss: 0.8718, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||: 89%|########9 | 99/111 [01:08<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8170, UAS: 0.9314, LAS: 0.8773, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5947, partial_loss/deprel_loss: 1.1252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3897, loss: 0.8706, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||: 92%|#########1| 102/111 [01:10<00:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9312, LAS: 0.8771, UEM: 0.5340, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3184, partial_loss/deprel_loss: 0.5107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8734, batch_reg_loss: 0.1706, reg_loss: 0.1698 ||: 95%|#########4| 105/111 [01:12<00:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9314, LAS: 0.8773, UEM: 0.5357, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1379, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.8727, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||: 98%|#########8| 109/111 [01:15<00:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9312, LAS: 0.8771, UEM: 0.5351, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.3903, partial_loss/deprel_loss: 1.0609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2975, loss: 0.8749, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||: 100%|##########| 111/111 [01:16<00:00, 1.44it/s]\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.061 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.390 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - reg_loss | 0.170 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UEM | 0.535 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LAS | 0.877 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - loss | 0.875 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LEM | 0.302 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UAS | 0.931 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EM | 0.832 | N/A\n", + "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Epoch duration: 0:01:16.973170\n", + "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Estimated training time remaining: 7:27:46\n", + "2023-04-07 00:05:43,648 - INFO - allennlp.training.trainer - Epoch 58/399\n", + "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:05:43,656 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9595, LAS: 0.9153, UEM: 0.8286, LEM: 0.6638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0595, partial_loss/deprel_loss: 0.1632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3132, loss: 0.6007, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 3%|2 | 3/111 [00:02<01:31, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9561, LAS: 0.9084, UEM: 0.7561, LEM: 0.5438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3785, partial_loss/deprel_loss: 0.5578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 
0.6717, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 5%|5 | 6/111 [00:04<01:24, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9398, LAS: 0.8906, UEM: 0.6781, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 0.8015, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 8%|8 | 9/111 [00:06<01:19, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9390, LAS: 0.8898, UEM: 0.6879, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1247, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4267, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||: 11%|# | 12/111 [00:09<01:16, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9394, LAS: 0.8893, UEM: 0.6638, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||: 14%|#3 | 15/111 [00:11<01:13, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9375, LAS: 0.8866, UEM: 0.6227, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4958, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8116, batch_reg_loss: 0.1710, reg_loss: 0.1708 ||: 16%|#6 | 18/111 [00:13<01:09, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9390, LAS: 0.8878, UEM: 0.6204, LEM: 
0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7963, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||: 19%|#8 | 21/111 [00:15<01:06, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9392, LAS: 0.8883, UEM: 0.6134, LEM: 0.3908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7934, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9666, loss: 0.7907, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||: 22%|##1 | 24/111 [00:17<01:03, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9363, LAS: 0.8847, UEM: 0.5900, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5115, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7612, loss: 0.8143, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||: 24%|##4 | 27/111 [00:19<01:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9362, LAS: 0.8844, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9451, partial_loss/deprel_loss: 0.7701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9762, loss: 0.8149, batch_reg_loss: 0.1712, reg_loss: 0.1709 ||: 28%|##7 | 31/111 [00:22<00:55, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9355, LAS: 0.8831, UEM: 0.5606, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8069, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9223, loss: 0.8263, batch_reg_loss: 0.1712, reg_loss: 0.1710 
||: 31%|### | 34/111 [00:24<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9365, LAS: 0.8844, UEM: 0.5572, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.6048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7657, loss: 0.8172, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||: 33%|###3 | 37/111 [00:26<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9357, LAS: 0.8834, UEM: 0.5464, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0234, loss: 0.8234, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||: 37%|###6 | 41/111 [00:29<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9355, LAS: 0.8831, UEM: 0.5659, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2456, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.8257, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||: 40%|###9 | 44/111 [00:31<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9308, LAS: 0.8782, UEM: 0.5494, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9662, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 0.8680, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||: 43%|####3 | 48/111 [00:33<00:42, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9301, LAS: 0.8776, UEM: 0.5468, LEM: 0.3233, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3291, partial_loss/deprel_loss: 0.4619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.8733, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||: 46%|####5 | 51/111 [00:36<00:42, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9301, LAS: 0.8774, UEM: 0.5459, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2580, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5641, loss: 0.8732, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||: 49%|####8 | 54/111 [00:38<00:39, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9303, LAS: 0.8775, UEM: 0.5463, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9609, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0534, loss: 0.8687, batch_reg_loss: 0.1716, reg_loss: 0.1711 ||: 51%|#####1 | 57/111 [00:40<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9323, LAS: 0.8796, UEM: 0.5627, LEM: 0.3346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6973, loss: 0.8529, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||: 55%|#####4 | 61/111 [00:42<00:34, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9310, LAS: 0.8782, UEM: 0.5520, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1179, partial_loss/deprel_loss: 0.8586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0821, 
loss: 0.8627, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||: 59%|#####8 | 65/111 [00:45<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9320, LAS: 0.8792, UEM: 0.5555, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5933, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8227, loss: 0.8550, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||: 61%|######1 | 68/111 [00:47<00:29, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9326, LAS: 0.8796, UEM: 0.5645, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.8516, batch_reg_loss: 0.1718, reg_loss: 0.1712 ||: 64%|######3 | 71/111 [00:49<00:28, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9329, LAS: 0.8797, UEM: 0.5560, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6251, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9015, loss: 0.8517, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||: 68%|######7 | 75/111 [00:52<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9324, LAS: 0.8787, UEM: 0.5451, LEM: 0.3162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0988, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1186, loss: 0.8610, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 
0.9328, LAS: 0.8791, UEM: 0.5434, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3353, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||: 74%|#######3 | 82/111 [00:57<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9323, LAS: 0.8787, UEM: 0.5416, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9362, loss: 0.8612, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||: 77%|#######6 | 85/111 [00:59<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9317, LAS: 0.8779, UEM: 0.5354, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.8666, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||: 79%|#######9 | 88/111 [01:01<00:15, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9319, LAS: 0.8783, UEM: 0.5453, LEM: 0.3187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1393, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.8646, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||: 83%|########2 | 92/111 [01:04<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9318, LAS: 0.8782, UEM: 0.5385, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9511, partial_loss/deprel_loss: 0.9121, partial_loss/cycle_loss: 0.0000, batch_loss: 
1.0920, loss: 0.8661, batch_reg_loss: 0.1721, reg_loss: 0.1714 ||: 86%|########6 | 96/111 [01:06<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9316, LAS: 0.8780, UEM: 0.5317, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6062, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8335, loss: 0.8693, batch_reg_loss: 0.1722, reg_loss: 0.1714 ||: 90%|######### | 100/111 [01:09<00:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9321, LAS: 0.8787, UEM: 0.5358, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2498, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.8622, batch_reg_loss: 0.1722, reg_loss: 0.1715 ||: 94%|#########3| 104/111 [01:11<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9325, LAS: 0.8791, UEM: 0.5368, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.7346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8835, loss: 0.8581, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 96%|#########6| 107/111 [01:13<00:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.436 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.278 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UEM | 0.533 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - LAS | 0.878 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - loss | 0.865 | N/A\n", + "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:07:00,261 
- INFO - combo.training.tensorboard_writer - LEM | 0.307 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EM | 0.913 | N/A\n", + "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Epoch duration: 0:01:16.613383\n", + "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Estimated training time remaining: 7:26:16\n", + "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Epoch 59/399\n", + "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:07:00,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:07:00,270 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9336, LAS: 0.8775, UEM: 0.3808, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7637, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.8668, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 4%|3 | 4/111 [00:02<01:07, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9333, LAS: 0.8780, UEM: 0.5207, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2748, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5761, loss: 0.8606, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 6%|6 | 7/111 [00:04<01:08, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8552, UAS: 0.9347, LAS: 0.8794, UEM: 0.4916, LEM: 0.2364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9107, partial_loss/deprel_loss: 0.8228, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0128, loss: 0.8498, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||: 9%|9 | 10/111 [00:06<01:07, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9266, LAS: 0.8729, UEM: 0.4409, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3004, partial_loss/deprel_loss: 0.9704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8981, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||: 12%|#1 | 13/111 [00:08<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9335, LAS: 0.8811, UEM: 0.5484, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.8355, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||: 14%|#4 | 16/111 [00:11<01:06, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9277, LAS: 0.8738, UEM: 0.4982, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9376, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4295, loss: 0.8938, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||: 18%|#8 | 20/111 [00:13<01:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9292, LAS: 0.8751, UEM: 0.5387, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4109, loss: 0.8872, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||: 21%|## | 23/111 [00:15<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9307, LAS: 0.8770, UEM: 0.5338, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.8721, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||: 23%|##3 | 26/111 [00:18<01:01, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8759, UEM: 0.5318, LEM: 0.3076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7775, loss: 0.8817, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||: 26%|##6 | 29/111 [00:20<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9292, LAS: 0.8753, UEM: 0.5118, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8447, partial_loss/deprel_loss: 0.8250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0018, loss: 0.8869, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||: 29%|##8 | 32/111 [00:22<00:55, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9321, LAS: 0.8791, UEM: 0.5550, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3670, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5100, loss: 0.8576, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||: 32%|###1 | 35/111 [00:24<00:54, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9342, LAS: 0.8816, UEM: 0.5933, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0539, partial_loss/deprel_loss: 0.1786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3265, loss: 0.8401, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||: 34%|###4 | 38/111 [00:27<00:56, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9332, LAS: 0.8807, UEM: 0.5845, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9054, loss: 0.8468, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||: 37%|###6 | 41/111 [00:29<00:52, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9329, LAS: 0.8802, UEM: 0.5758, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 0.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1480, loss: 0.8477, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||: 40%|###9 | 44/111 [00:31<00:49, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9333, LAS: 0.8805, UEM: 0.5705, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.4947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.8465, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||: 42%|####2 | 47/111 [00:33<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9328, LAS: 0.8799, UEM: 0.5733, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.8541, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||: 46%|####5 | 51/111 [00:36<00:43, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9341, LAS: 0.8814, UEM: 0.5789, LEM: 0.3594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3308, partial_loss/deprel_loss: 0.5056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.8426, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||: 49%|####8 | 54/111 [00:38<00:41, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9337, LAS: 0.8810, UEM: 0.5784, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.4433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5823, loss: 0.8452, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||: 51%|#####1 | 57/111 [00:40<00:39, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9347, LAS: 0.8819, UEM: 0.5824, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5877, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8124, loss: 0.8381, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||: 54%|#####4 | 60/111 [00:43<00:38, 1.33it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9333, LAS: 0.8805, UEM: 0.5715, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.4308, partial_loss/deprel_loss: 1.1157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3520, loss: 0.8506, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||: 57%|#####6 | 63/111 [00:45<00:35, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9334, LAS: 0.8804, UEM: 0.5614, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9261, loss: 0.8528, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||: 60%|###### | 67/111 [00:47<00:29, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9334, LAS: 0.8803, UEM: 0.5556, LEM: 0.3320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9412, partial_loss/deprel_loss: 0.8262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0225, loss: 0.8533, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||: 64%|######3 | 71/111 [00:49<00:25, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9320, LAS: 0.8785, UEM: 0.5549, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1992, partial_loss/deprel_loss: 0.3865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5224, loss: 0.8659, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||: 68%|######7 | 75/111 [00:52<00:23, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8442, UAS: 0.9316, LAS: 0.8779, UEM: 0.5463, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0091, partial_loss/deprel_loss: 0.9599, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1432, loss: 0.8711, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||: 71%|#######1 | 79/111 [00:55<00:21, 
1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9326, LAS: 0.8789, UEM: 0.5523, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2824, partial_loss/deprel_loss: 0.4500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5900, loss: 0.8622, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||: 75%|#######4 | 83/111 [00:58<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9327, LAS: 0.8790, UEM: 0.5486, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2842, partial_loss/deprel_loss: 0.5412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6634, loss: 0.8606, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||: 77%|#######7 | 86/111 [01:00<00:17, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9320, LAS: 0.8782, UEM: 0.5492, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.8675, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||: 80%|######## | 89/111 [01:02<00:15, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9325, LAS: 0.8787, UEM: 0.5477, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.7544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 0.8624, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||: 84%|########3 | 93/111 [01:04<00:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9321, LAS: 0.8784, UEM: 0.5426, LEM: 0.3108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.9823, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8656, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||: 86%|########6 | 96/111 [01:06<00:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9319, LAS: 0.8782, UEM: 0.5405, LEM: 0.3084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8675, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||: 90%|######### | 100/111 [01:09<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8785, UEM: 0.5404, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 0.6216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7748, loss: 0.8655, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||: 94%|#########3| 104/111 [01:12<00:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9324, LAS: 0.8785, UEM: 0.5361, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4727, partial_loss/deprel_loss: 0.5968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7458, loss: 0.8654, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||: 96%|#########6| 107/111 [01:14<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9322, LAS: 0.8783, UEM: 0.5396, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.7900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.8659, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||: 99%|#########9| 
110/111 [01:16<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9319, LAS: 0.8779, UEM: 0.5374, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1673, partial_loss/deprel_loss: 0.9337, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1543, loss: 0.8685, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||: 100%|##########| 111/111 [01:17<00:00, 1.44it/s]\n", + "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.934 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.167 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UEM | 0.537 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LAS | 0.878 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - loss | 0.869 | N/A\n", + 
"2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEM | 0.305 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - EM | 0.837 | N/A\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Epoch duration: 0:01:17.327204\n", + "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:51\n", + "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Epoch 60/399\n", + "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:08:17,598 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9362, LAS: 0.8814, UEM: 0.3503, LEM: 0.1203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8993, loss: 0.8470, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||: 3%|2 | 3/111 [00:02<01:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, 
UAS: 0.9321, LAS: 0.8779, UEM: 0.3913, LEM: 0.1676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2081, partial_loss/deprel_loss: 0.9663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1886, loss: 0.8611, batch_reg_loss: 0.1740, reg_loss: 0.1739 ||: 6%|6 | 7/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7929, UAS: 0.9231, LAS: 0.8686, UEM: 0.3932, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0036, partial_loss/deprel_loss: 1.1850, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5227, loss: 0.9405, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 9%|9 | 10/111 [00:07<01:13, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9264, LAS: 0.8725, UEM: 0.4786, LEM: 0.2742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.9067, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||: 12%|#1 | 13/111 [00:09<01:14, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9316, LAS: 0.8780, UEM: 0.5387, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6095, partial_loss/deprel_loss: 0.6517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8174, loss: 0.8575, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||: 14%|#4 | 16/111 [00:11<01:10, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9362, LAS: 0.8836, UEM: 0.6020, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0994, partial_loss/deprel_loss: 0.2475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3920, loss: 0.8120, 
batch_reg_loss: 0.1742, reg_loss: 0.1740 ||: 18%|#8 | 20/111 [00:14<01:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9373, LAS: 0.8850, UEM: 0.5973, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5161, partial_loss/deprel_loss: 0.6815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8226, loss: 0.8053, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||: 22%|##1 | 24/111 [00:16<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9403, LAS: 0.8883, UEM: 0.6151, LEM: 0.3769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4976, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 0.7819, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||: 25%|##5 | 28/111 [00:19<00:54, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9413, LAS: 0.8891, UEM: 0.6076, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4554, partial_loss/deprel_loss: 0.5114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.7749, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||: 28%|##7 | 31/111 [00:21<00:54, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9397, LAS: 0.8876, UEM: 0.6007, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.7878, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||: 31%|### | 34/111 [00:23<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9376, LAS: 0.8857, UEM: 0.5841, 
LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2452, partial_loss/deprel_loss: 0.9293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1668, loss: 0.8026, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||: 33%|###3 | 37/111 [00:25<00:52, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9343, LAS: 0.8819, UEM: 0.5689, LEM: 0.3378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8595, partial_loss/deprel_loss: 0.8019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9878, loss: 0.8301, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||: 36%|###6 | 40/111 [00:27<00:50, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8483, UAS: 0.9321, LAS: 0.8796, UEM: 0.5564, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1939, partial_loss/deprel_loss: 0.9149, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1451, loss: 0.8517, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||: 40%|###9 | 44/111 [00:30<00:47, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9335, LAS: 0.8809, UEM: 0.5663, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6075, loss: 0.8412, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||: 42%|####2 | 47/111 [00:32<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9348, LAS: 0.8828, UEM: 0.5920, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6005, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7820, loss: 0.8263, batch_reg_loss: 0.1745, 
reg_loss: 0.1742 ||: 45%|####5 | 50/111 [00:35<00:47, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9329, LAS: 0.8806, UEM: 0.5860, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5709, partial_loss/deprel_loss: 1.0503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3290, loss: 0.8424, batch_reg_loss: 0.1745, reg_loss: 0.1742 ||: 48%|####7 | 53/111 [00:38<00:45, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9336, LAS: 0.8812, UEM: 0.5811, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 0.9016, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0842, loss: 0.8390, batch_reg_loss: 0.1746, reg_loss: 0.1742 ||: 51%|#####1 | 57/111 [00:40<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9304, LAS: 0.8778, UEM: 0.5673, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2525, partial_loss/deprel_loss: 0.9174, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1591, loss: 0.8677, batch_reg_loss: 0.1746, reg_loss: 0.1743 ||: 55%|#####4 | 61/111 [00:43<00:35, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9310, LAS: 0.8782, UEM: 0.5702, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9025, partial_loss/deprel_loss: 0.9015, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0764, loss: 0.8632, batch_reg_loss: 0.1747, reg_loss: 0.1743 ||: 58%|#####7 | 64/111 [00:45<00:33, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9107, UAS: 0.9320, LAS: 0.8794, UEM: 0.5685, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.8545, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||: 61%|######1 | 68/111 [00:47<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9312, LAS: 0.8783, UEM: 0.5588, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.7282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9039, loss: 0.8620, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||: 64%|######3 | 71/111 [00:50<00:28, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9307, LAS: 0.8778, UEM: 0.5490, LEM: 0.3263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0077, partial_loss/deprel_loss: 0.8423, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0502, loss: 0.8669, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||: 68%|######7 | 75/111 [00:52<00:24, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9306, LAS: 0.8776, UEM: 0.5447, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.5258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6645, loss: 0.8677, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||: 70%|####### | 78/111 [00:54<00:22, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9295, LAS: 0.8763, UEM: 0.5389, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3530, partial_loss/deprel_loss: 0.5616, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.6949, loss: 0.8791, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||: 74%|#######3 | 82/111 [00:57<00:19, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9295, LAS: 0.8762, UEM: 0.5307, LEM: 0.3081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.7822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9723, loss: 0.8802, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||: 77%|#######7 | 86/111 [00:59<00:16, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9299, LAS: 0.8766, UEM: 0.5393, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.3223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4657, loss: 0.8764, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||: 81%|########1 | 90/111 [01:02<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9300, LAS: 0.8768, UEM: 0.5359, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4274, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8751, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||: 84%|########3 | 93/111 [01:05<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9306, LAS: 0.8774, UEM: 0.5408, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8691, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||: 87%|########7 | 97/111 [01:07<00:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9311, LAS: 0.8780, UEM: 0.5431, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5743, partial_loss/deprel_loss: 0.6671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8238, loss: 0.8644, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||: 90%|######### | 100/111 [01:10<00:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9306, LAS: 0.8773, UEM: 0.5365, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0491, partial_loss/deprel_loss: 0.9409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1378, loss: 0.8708, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||: 94%|#########3| 104/111 [01:12<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9302, LAS: 0.8767, UEM: 0.5311, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4103, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.8771, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||: 97%|#########7| 108/111 [01:14<00:01, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9305, LAS: 0.8769, UEM: 0.5294, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 0.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8986, loss: 0.8754, batch_reg_loss: 0.1754, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:09:34,322 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9379, LAS: 0.8794, UEM: 0.4599, LEM: 0.1283, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5266, partial_loss/deprel_loss: 24.2651, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5174, loss: 24.7563, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9527, LAS: 0.8970, UEM: 0.6623, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 26.3179, partial_loss/cycle_loss: 0.0000, batch_loss: 21.1372, loss: 22.3640, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.11it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9426, LAS: 0.8873, UEM: 0.6137, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6098, partial_loss/deprel_loss: 34.3925, partial_loss/cycle_loss: 0.0000, batch_loss: 27.6359, loss: 26.0534, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8674, UAS: 0.9435, LAS: 0.8887, UEM: 0.5935, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0499, partial_loss/deprel_loss: 43.7402, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2022, loss: 25.6088, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 
0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.04it/s]\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.741 | 48.788\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.652 | 1.316\n", + "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - reg_loss | 0.175 | 0.000\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UEM | 0.529 | 0.641\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LAS | 0.877 | 0.891\n", + "2023-04-07 00:09:46,835 - INFO - 
combo.training.tensorboard_writer - loss | 0.875 | 25.957\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEM | 0.305 | 0.372\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UAS | 0.930 | 0.944\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EM | 0.873 | 0.861\n", + "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:09:49,183 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Epoch duration: 0:01:32.803051\n", + "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:52\n", + "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Epoch 61/399\n", + "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:09:50,399 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9301, LAS: 0.8725, UEM: 0.4525, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7400, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.8934, batch_reg_loss: 0.1754, reg_loss: 0.1754 ||: 3%|2 | 3/111 [00:02<01:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9359, LAS: 0.8807, UEM: 0.5602, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7916, loss: 0.8117, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||: 5%|5 | 6/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9390, LAS: 0.8858, UEM: 0.5364, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.5122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6688, loss: 0.7848, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||: 8%|8 | 9/111 [00:06<01:10, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9267, LAS: 0.8726, UEM: 0.4816, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7705, partial_loss/deprel_loss: 1.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5137, loss: 0.9004, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 11%|# | 12/111 [00:08<01:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9329, LAS: 0.8789, UEM: 0.5466, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7115, loss: 0.8472, batch_reg_loss: 0.1756, reg_loss: 0.1755 ||: 14%|#3 | 15/111 [00:10<01:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9263, LAS: 0.8721, UEM: 0.4951, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4953, partial_loss/deprel_loss: 0.9569, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2402, loss: 0.9045, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||: 17%|#7 | 19/111 [00:13<01:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9278, LAS: 0.8743, UEM: 0.5035, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.8852, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||: 20%|#9 | 22/111 [00:15<01:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9288, LAS: 0.8748, UEM: 0.4971, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2908, partial_loss/deprel_loss: 0.5508, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.8829, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||: 23%|##2 | 25/111 [00:17<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9293, LAS: 0.8759, UEM: 0.5267, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2407, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.8696, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||: 25%|##5 | 28/111 [00:19<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9297, LAS: 0.8768, UEM: 0.5495, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5913, partial_loss/deprel_loss: 1.1328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4003, loss: 0.8653, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||: 28%|##7 | 31/111 [00:21<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9309, LAS: 0.8782, UEM: 0.5469, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9686, loss: 0.8547, batch_reg_loss: 0.1759, reg_loss: 0.1756 ||: 31%|### | 34/111 [00:24<00:56, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9306, LAS: 0.8777, UEM: 0.5350, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9533, partial_loss/deprel_loss: 0.8344, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.8590, batch_reg_loss: 0.1759, reg_loss: 0.1757 ||: 33%|###3 | 37/111 [00:26<00:54, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9295, LAS: 0.8769, UEM: 0.5536, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4604, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6909, loss: 0.8681, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||: 36%|###6 | 40/111 [00:28<00:53, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9295, LAS: 0.8769, UEM: 0.5425, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7018, loss: 0.8705, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||: 39%|###8 | 43/111 [00:30<00:49, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9290, LAS: 0.8759, UEM: 0.5314, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9200, loss: 0.8797, batch_reg_loss: 0.1761, reg_loss: 0.1757 ||: 42%|####2 | 47/111 [00:33<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9299, LAS: 0.8766, UEM: 0.5275, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0313, partial_loss/deprel_loss: 0.9238, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1214, loss: 0.8750, batch_reg_loss: 0.1761, reg_loss: 0.1758 ||: 46%|####5 | 51/111 [00:35<00:40, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9301, LAS: 0.8769, UEM: 0.5190, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5316, partial_loss/deprel_loss: 0.5359, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.7112, loss: 0.8718, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||: 49%|####8 | 54/111 [00:38<00:39, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9306, LAS: 0.8773, UEM: 0.5160, LEM: 0.2865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8318, loss: 0.8682, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||: 52%|#####2 | 58/111 [00:40<00:35, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9301, LAS: 0.8768, UEM: 0.5379, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9494, partial_loss/deprel_loss: 0.8664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0593, loss: 0.8701, batch_reg_loss: 0.1763, reg_loss: 0.1758 ||: 56%|#####5 | 62/111 [00:43<00:35, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9310, LAS: 0.8777, UEM: 0.5382, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3715, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6608, loss: 0.8643, batch_reg_loss: 0.1763, reg_loss: 0.1759 ||: 59%|#####8 | 65/111 [00:45<00:32, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9318, LAS: 0.8785, UEM: 0.5475, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3592, partial_loss/deprel_loss: 0.5754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 0.8581, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||: 61%|######1 | 68/111 [00:48<00:32, 1.34it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9326, LAS: 0.8792, UEM: 0.5501, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4939, partial_loss/deprel_loss: 0.6939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8303, loss: 0.8533, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||: 64%|######3 | 71/111 [00:50<00:29, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9329, LAS: 0.8796, UEM: 0.5458, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8771, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9980, loss: 0.8528, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||: 68%|######7 | 75/111 [00:52<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9329, LAS: 0.8795, UEM: 0.5392, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7339, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8561, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||: 70%|####### | 78/111 [00:54<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9331, LAS: 0.8798, UEM: 0.5351, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8542, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||: 74%|#######3 | 82/111 [00:57<00:19, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9331, LAS: 0.8796, UEM: 0.5288, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.9883, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8549, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||: 77%|#######7 | 86/111 [00:59<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9325, LAS: 0.8789, UEM: 0.5258, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1699, partial_loss/deprel_loss: 0.9620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1802, loss: 0.8598, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||: 81%|########1 | 90/111 [01:02<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9327, LAS: 0.8790, UEM: 0.5229, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.7385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8827, loss: 0.8601, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||: 85%|########4 | 94/111 [01:05<00:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9327, LAS: 0.8789, UEM: 0.5254, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2904, partial_loss/deprel_loss: 0.4370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.8596, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||: 88%|########8 | 98/111 [01:08<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9322, LAS: 0.8783, UEM: 0.5222, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 0.8358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0177, loss: 0.8647, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||: 92%|#########1| 102/111 [01:11<00:06, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8329, UAS: 0.9325, LAS: 0.8787, UEM: 0.5388, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3338, partial_loss/deprel_loss: 0.9728, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 0.8622, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||: 95%|#########4| 105/111 [01:13<00:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9322, LAS: 0.8784, UEM: 0.5361, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.6854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8494, loss: 0.8656, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||: 98%|#########8| 109/111 [01:16<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9319, LAS: 0.8781, UEM: 0.5376, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5148, partial_loss/deprel_loss: 1.0411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 0.8674, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - 
combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.041 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.515 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - reg_loss | 0.176 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UEM | 0.538 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LAS | 0.878 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - loss | 0.867 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEM | 0.305 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UAS | 0.932 | N/A\n", + "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - EM | 0.816 | N/A\n", + "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:11:10,313 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Epoch duration: 0:01:25.568982\n", + "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:11\n", + "2023-04-07 00:11:15,962 - INFO - allennlp.training.trainer - Epoch 62/399\n", + "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:11:15,970 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9461, LAS: 0.8929, UEM: 0.6482, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8178, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9265, loss: 0.7051, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 3%|2 | 3/111 [00:02<01:19, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9367, LAS: 0.8823, UEM: 0.5942, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.8175, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 6%|6 | 7/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7817, UAS: 0.9301, LAS: 0.8763, UEM: 0.5643, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2934, partial_loss/deprel_loss: 1.3399, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7076, loss: 0.8878, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||: 9%|9 | 10/111 
[00:06<01:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9312, LAS: 0.8783, UEM: 0.5568, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2351, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.8788, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||: 13%|#2 | 14/111 [00:09<01:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9361, LAS: 0.8829, UEM: 0.5695, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6782, loss: 0.8412, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||: 15%|#5 | 17/111 [00:11<01:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9335, LAS: 0.8806, UEM: 0.5433, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0345, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0062, loss: 0.8508, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||: 18%|#8 | 20/111 [00:13<01:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9343, LAS: 0.8818, UEM: 0.5205, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6520, partial_loss/deprel_loss: 0.6173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.8428, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||: 22%|##1 | 24/111 [00:16<00:58, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9322, LAS: 0.8798, UEM: 0.4931, LEM: 0.2629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.7861, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9202, loss: 0.8579, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||: 25%|##5 | 28/111 [00:18<00:55, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9330, LAS: 0.8811, UEM: 0.5272, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3901, loss: 0.8492, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||: 28%|##7 | 31/111 [00:21<00:56, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9329, LAS: 0.8809, UEM: 0.5126, LEM: 0.2930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5720, partial_loss/deprel_loss: 0.6731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8298, loss: 0.8500, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||: 31%|### | 34/111 [00:23<00:54, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9333, LAS: 0.8813, UEM: 0.5162, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5572, partial_loss/deprel_loss: 0.5714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.8451, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||: 33%|###3 | 37/111 [00:25<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9343, LAS: 0.8824, UEM: 0.5142, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4571, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.8359, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||: 36%|###6 | 40/111 [00:27<00:52, 1.35it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9351, LAS: 0.8832, UEM: 0.5291, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6177, loss: 0.8277, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||: 39%|###8 | 43/111 [00:30<00:50, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9371, LAS: 0.8861, UEM: 0.5756, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.8072, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 41%|####1 | 46/111 [00:32<00:49, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9372, LAS: 0.8862, UEM: 0.5747, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0707, partial_loss/deprel_loss: 0.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0771, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 44%|####4 | 49/111 [00:34<00:47, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9382, LAS: 0.8872, UEM: 0.5813, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4093, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 0.7991, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 47%|####6 | 52/111 [00:36<00:43, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9379, LAS: 0.8868, UEM: 0.5728, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9311, partial_loss/deprel_loss: 0.9079, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 50%|##### | 56/111 [00:39<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9370, LAS: 0.8861, UEM: 0.5686, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5706, loss: 0.8109, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 53%|#####3 | 59/111 [00:41<00:36, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9375, LAS: 0.8867, UEM: 0.5667, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.6020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7437, loss: 0.8056, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||: 56%|#####5 | 62/111 [00:43<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9370, LAS: 0.8863, UEM: 0.5694, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3908, partial_loss/deprel_loss: 0.5036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6579, loss: 0.8078, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 59%|#####8 | 65/111 [00:45<00:33, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9366, LAS: 0.8859, UEM: 0.5667, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.3820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.8122, batch_reg_loss: 0.1768, 
reg_loss: 0.1769 ||: 61%|######1 | 68/111 [00:47<00:30, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9359, LAS: 0.8850, UEM: 0.5564, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8085, partial_loss/deprel_loss: 0.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9946, loss: 0.8185, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 65%|######4 | 72/111 [00:50<00:26, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8626, UAS: 0.9351, LAS: 0.8842, UEM: 0.5619, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0201, partial_loss/deprel_loss: 0.7898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0127, loss: 0.8247, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 68%|######7 | 75/111 [00:52<00:25, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9361, LAS: 0.8853, UEM: 0.5672, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3834, partial_loss/deprel_loss: 0.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6762, loss: 0.8170, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 70%|####### | 78/111 [00:54<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9357, LAS: 0.8848, UEM: 0.5614, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 0.8223, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 74%|#######3 | 82/111 [00:57<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9364, LAS: 0.8856, UEM: 0.5646, LEM: 
0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.5018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.8165, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 77%|#######6 | 85/111 [00:59<00:17, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9356, LAS: 0.8847, UEM: 0.5610, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8515, loss: 0.8214, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 80%|######## | 89/111 [01:01<00:14, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9349, LAS: 0.8840, UEM: 0.5549, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9371, partial_loss/deprel_loss: 0.8498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0440, loss: 0.8271, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 84%|########3 | 93/111 [01:04<00:11, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9349, LAS: 0.8841, UEM: 0.5478, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6846, partial_loss/deprel_loss: 0.6411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8266, loss: 0.8268, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 87%|########7 | 97/111 [01:06<00:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9355, LAS: 0.8848, UEM: 0.5496, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3925, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7199, loss: 0.8227, batch_reg_loss: 
0.1768, reg_loss: 0.1769 ||: 91%|######### | 101/111 [01:09<00:06, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9350, LAS: 0.8839, UEM: 0.5418, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5451, partial_loss/deprel_loss: 0.6392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7972, loss: 0.8280, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 95%|#########4| 105/111 [01:12<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9350, LAS: 0.8839, UEM: 0.5435, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7372, partial_loss/deprel_loss: 0.6851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8723, loss: 0.8279, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 98%|#########8| 109/111 [01:15<00:01, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9352, LAS: 0.8843, UEM: 0.5459, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2081, partial_loss/deprel_loss: 0.3644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.8251, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - 
ELAS | 0.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.364 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.208 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - reg_loss | 0.177 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UEM | 0.546 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LAS | 0.884 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - loss | 0.825 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEM | 0.321 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UAS | 0.935 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EM | 0.926 | N/A\n", + "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:12:35,734 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:12:40,483 - INFO - combo.training.trainer - Epoch duration: 0:01:24.520495\n", + "2023-04-07 00:12:40,484 - INFO - combo.training.trainer - Estimated training time remaining: 7:23:22\n", + "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Epoch 63/399\n", + "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:12:40,485 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:12:40,495 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9622, LAS: 0.9136, UEM: 0.7143, LEM: 0.3932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.4429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5662, batch_reg_loss: 0.1767, reg_loss: 0.1768 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9647, LAS: 0.9167, UEM: 0.7773, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1387, partial_loss/deprel_loss: 0.3915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.5657, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 5%|5 | 6/111 [00:04<01:17, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9528, LAS: 0.9026, UEM: 0.7066, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.6629, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 9%|9 | 10/111 
[00:07<01:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8438, UAS: 0.9508, LAS: 0.8998, UEM: 0.6968, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0591, partial_loss/deprel_loss: 0.9699, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1644, loss: 0.6890, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 12%|#1 | 13/111 [00:09<01:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9486, LAS: 0.8977, UEM: 0.6604, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7111, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 15%|#5 | 17/111 [00:11<01:04, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9484, LAS: 0.8977, UEM: 0.6432, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.7174, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 19%|#8 | 21/111 [00:14<01:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9471, LAS: 0.8968, UEM: 0.6249, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3350, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5877, loss: 0.7248, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 22%|##1 | 24/111 [00:16<01:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9458, LAS: 0.8951, UEM: 0.6095, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3742, partial_loss/deprel_loss: 0.5653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7037, loss: 0.7378, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||: 24%|##4 | 27/111 [00:18<00:58, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9469, LAS: 0.8963, UEM: 0.6098, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2797, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.7258, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 28%|##7 | 31/111 [00:21<00:54, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9419, LAS: 0.8912, UEM: 0.5994, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3695, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6213, loss: 0.7673, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 31%|### | 34/111 [00:23<00:54, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9405, LAS: 0.8897, UEM: 0.5848, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.7788, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 33%|###3 | 37/111 [00:25<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9384, LAS: 0.8874, UEM: 0.5624, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9695, partial_loss/deprel_loss: 0.7204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9468, loss: 0.7958, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 37%|###6 | 41/111 [00:28<00:49, 1.40it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9389, LAS: 0.8880, UEM: 0.5617, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5843, loss: 0.7929, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 40%|###9 | 44/111 [00:30<00:48, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9394, LAS: 0.8883, UEM: 0.5660, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5540, partial_loss/deprel_loss: 0.6572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8132, loss: 0.7888, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 42%|####2 | 47/111 [00:33<00:47, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9408, LAS: 0.8902, UEM: 0.5851, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4763, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7508, loss: 0.7764, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 45%|####5 | 50/111 [00:35<00:47, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9396, LAS: 0.8890, UEM: 0.5734, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9640, partial_loss/deprel_loss: 0.7751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7859, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 48%|####7 | 53/111 [00:38<00:44, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9395, LAS: 0.8891, UEM: 0.5686, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4899, partial_loss/deprel_loss: 0.5436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7095, loss: 0.7854, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 50%|##### | 56/111 [00:40<00:41, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9399, LAS: 0.8895, UEM: 0.5699, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2513, partial_loss/deprel_loss: 0.4202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.7826, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 53%|#####3 | 59/111 [00:42<00:39, 1.30it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9391, LAS: 0.8886, UEM: 0.5616, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.7914, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 56%|#####5 | 62/111 [00:44<00:36, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9392, LAS: 0.8885, UEM: 0.5575, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7910, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||: 59%|#####9 | 66/111 [00:47<00:32, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9386, LAS: 0.8878, UEM: 0.5526, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9313, loss: 0.7982, batch_reg_loss: 0.1766, 
reg_loss: 0.1767 ||: 62%|######2 | 69/111 [00:49<00:29, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9385, LAS: 0.8875, UEM: 0.5494, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6389, loss: 0.8003, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||: 65%|######4 | 72/111 [00:51<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9390, LAS: 0.8885, UEM: 0.5791, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4339, loss: 0.7948, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||: 68%|######7 | 75/111 [00:54<00:27, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9369, LAS: 0.8863, UEM: 0.5684, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7013, partial_loss/deprel_loss: 0.9147, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8097, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||: 71%|#######1 | 79/111 [00:56<00:23, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9371, LAS: 0.8866, UEM: 0.5699, LEM: 0.3353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5090, loss: 0.8084, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 75%|#######4 | 83/111 [00:59<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9383, LAS: 0.8878, UEM: 0.5797, 
LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1914, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.7984, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 78%|#######8 | 87/111 [01:02<00:16, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9379, LAS: 0.8874, UEM: 0.5752, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3438, partial_loss/deprel_loss: 0.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.8011, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 82%|########1 | 91/111 [01:04<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9383, LAS: 0.8878, UEM: 0.5733, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3745, partial_loss/deprel_loss: 0.4885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6422, loss: 0.7969, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 85%|########4 | 94/111 [01:06<00:11, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9383, LAS: 0.8879, UEM: 0.5673, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 0.7441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.7961, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 88%|########8 | 98/111 [01:09<00:08, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9386, LAS: 0.8882, UEM: 0.5673, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.7950, 
batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 92%|#########1| 102/111 [01:12<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9391, LAS: 0.8888, UEM: 0.5696, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2042, partial_loss/deprel_loss: 0.3583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7909, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 95%|#########4| 105/111 [01:14<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9389, LAS: 0.8884, UEM: 0.5633, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.7096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.7945, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 98%|#########8| 109/111 [01:16<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8158, UAS: 0.9386, LAS: 0.8880, UEM: 0.5631, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5034, partial_loss/deprel_loss: 1.0496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3169, loss: 0.7973, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 1.050 | N/A\n", + "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.503 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - reg_loss | 0.177 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UEM | 0.563 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LAS | 0.888 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - loss | 0.797 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEM | 0.323 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UAS | 0.939 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EM | 0.816 | N/A\n", + "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:14:00,976 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Epoch duration: 0:01:27.085147\n", + "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:46\n", + "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Epoch 64/399\n", + "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:14:07,579 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9424, LAS: 0.8965, UEM: 0.7553, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.5698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7159, loss: 0.7365, batch_reg_loss: 0.1765, reg_loss: 0.1765 ||: 3%|2 | 3/111 [00:02<01:20, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9456, LAS: 0.8991, UEM: 0.6562, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4812, partial_loss/deprel_loss: 0.5967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7501, loss: 0.7251, batch_reg_loss: 0.1764, reg_loss: 0.1765 ||: 6%|6 | 7/111 [00:04<01:13, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9400, LAS: 0.8915, UEM: 0.5800, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.5672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7133, loss: 0.7932, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 10%|9 | 11/111 
[00:07<01:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9398, LAS: 0.8908, UEM: 0.5572, LEM: 0.3242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3106, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6202, loss: 0.7940, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 13%|#2 | 14/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9379, LAS: 0.8888, UEM: 0.5385, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.8111, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 15%|#5 | 17/111 [00:11<01:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9404, LAS: 0.8915, UEM: 0.5680, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.7857, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 18%|#8 | 20/111 [00:14<01:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.9377, LAS: 0.8885, UEM: 0.5705, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2371, partial_loss/deprel_loss: 1.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7132, loss: 0.8161, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 21%|## | 23/111 [00:16<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9395, LAS: 0.8902, UEM: 0.5696, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4209, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6505, loss: 0.8001, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9428, LAS: 0.8938, UEM: 0.6109, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7724, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 26%|##6 | 29/111 [00:20<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9427, LAS: 0.8934, UEM: 0.6043, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8892, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9644, loss: 0.7738, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 29%|##8 | 32/111 [00:22<00:55, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9429, LAS: 0.8938, UEM: 0.5867, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4316, partial_loss/deprel_loss: 0.5089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6698, loss: 0.7712, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 32%|###2 | 36/111 [00:25<00:51, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9414, LAS: 0.8917, UEM: 0.5679, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9932, partial_loss/deprel_loss: 0.8972, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.7831, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 36%|###6 | 40/111 [00:27<00:46, 1.54it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9402, LAS: 0.8901, UEM: 0.5609, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4805, partial_loss/deprel_loss: 1.1199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3684, loss: 0.7962, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||: 40%|###9 | 44/111 [00:30<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9421, LAS: 0.8927, UEM: 0.5967, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2505, partial_loss/deprel_loss: 0.4069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.7783, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 43%|####3 | 48/111 [00:33<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9430, LAS: 0.8937, UEM: 0.5972, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2783, partial_loss/deprel_loss: 0.5068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.7690, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 47%|####6 | 52/111 [00:36<00:41, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9428, LAS: 0.8935, UEM: 0.5909, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7704, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 50%|##### | 56/111 [00:38<00:37, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9439, LAS: 0.8947, UEM: 0.6005, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7624, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 53%|#####3 | 59/111 [00:40<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9417, LAS: 0.8926, UEM: 0.5902, LEM: 0.3526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6636, partial_loss/deprel_loss: 0.9961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3059, loss: 0.7789, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 56%|#####5 | 62/111 [00:42<00:33, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9413, LAS: 0.8921, UEM: 0.5894, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.8454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0559, loss: 0.7818, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 59%|#####8 | 65/111 [00:45<00:32, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9409, LAS: 0.8915, UEM: 0.5879, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.7857, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 61%|######1 | 68/111 [00:47<00:30, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9415, LAS: 0.8921, UEM: 0.5966, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7684, partial_loss/deprel_loss: 0.6968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8874, loss: 0.7806, batch_reg_loss: 
0.1763, reg_loss: 0.1764 ||: 64%|######3 | 71/111 [00:49<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9415, LAS: 0.8920, UEM: 0.5889, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.7809, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 68%|######7 | 75/111 [00:52<00:25, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9410, LAS: 0.8913, UEM: 0.5785, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9618, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0183, loss: 0.7868, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||: 71%|#######1 | 79/111 [00:54<00:20, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9413, LAS: 0.8918, UEM: 0.5854, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0032, loss: 0.7828, batch_reg_loss: 0.1762, reg_loss: 0.1764 ||: 75%|#######4 | 83/111 [00:57<00:18, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9416, LAS: 0.8921, UEM: 0.5822, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3736, partial_loss/deprel_loss: 0.5020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.7811, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 78%|#######8 | 87/111 [01:00<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9419, LAS: 0.8924, UEM: 
0.5824, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2289, partial_loss/deprel_loss: 0.3876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.7777, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 81%|########1 | 90/111 [01:02<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9424, LAS: 0.8931, UEM: 0.5877, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.5226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.7721, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 84%|########3 | 93/111 [01:04<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9426, LAS: 0.8934, UEM: 0.5861, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3260, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.7709, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 87%|########7 | 97/111 [01:07<00:09, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9416, LAS: 0.8925, UEM: 0.5812, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8202, partial_loss/deprel_loss: 0.9301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2843, loss: 0.7767, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 91%|######### | 101/111 [01:09<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9417, LAS: 0.8925, UEM: 0.5748, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9002, loss: 0.7791, 
batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 95%|#########4| 105/111 [01:12<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9416, LAS: 0.8923, UEM: 0.5710, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9018, loss: 0.7798, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 97%|#########7| 108/111 [01:14<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.802 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.915 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - reg_loss | 0.176 | N/A\n", + "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UEM | 0.565 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LAS | 0.892 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - loss | 0.785 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEM | 0.329 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - UAS | 0.941 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EM | 0.855 | N/A\n", + "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:15:27,598 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:15:34,868 - INFO - combo.training.trainer - Epoch duration: 0:01:27.298867\n", + "2023-04-07 00:15:34,869 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:09\n", + "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Epoch 65/399\n", + "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:15:34,876 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9502, LAS: 0.9006, UEM: 0.4792, LEM: 0.2152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.4806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6294, loss: 0.7186, batch_reg_loss: 0.1762, reg_loss: 0.1762 ||: 3%|2 | 3/111 [00:02<01:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9285, LAS: 0.8794, UEM: 0.3964, LEM: 0.1731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6617, partial_loss/deprel_loss: 0.5697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.8714, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 5%|5 | 6/111 [00:04<01:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9329, LAS: 0.8837, UEM: 0.4081, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5837, partial_loss/deprel_loss: 0.6297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7967, loss: 0.8328, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 8%|8 | 9/111 
[00:06<01:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9340, LAS: 0.8848, UEM: 0.4359, LEM: 0.2012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1888, partial_loss/deprel_loss: 0.8942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8237, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 12%|#1 | 13/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9390, LAS: 0.8905, UEM: 0.5050, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.7799, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 14%|#4 | 16/111 [00:11<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9417, LAS: 0.8939, UEM: 0.5398, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4567, partial_loss/deprel_loss: 0.5314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 0.7536, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 17%|#7 | 19/111 [00:13<01:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9426, LAS: 0.8944, UEM: 0.5453, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5512, partial_loss/deprel_loss: 0.5817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.7517, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 20%|#9 | 22/111 [00:15<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9405, LAS: 0.8917, UEM: 0.5186, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.9198, partial_loss/deprel_loss: 0.7851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9881, loss: 0.7773, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 23%|##2 | 25/111 [00:17<01:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9414, LAS: 0.8929, UEM: 0.5435, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.7677, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 25%|##5 | 28/111 [00:19<00:57, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9427, LAS: 0.8947, UEM: 0.5851, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0904, partial_loss/deprel_loss: 0.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3692, loss: 0.7532, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 28%|##7 | 31/111 [00:22<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9421, LAS: 0.8936, UEM: 0.5740, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7529, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.7675, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 31%|### | 34/111 [00:24<00:54, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9422, LAS: 0.8932, UEM: 0.5649, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.6786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8331, loss: 0.7708, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 33%|###3 | 37/111 [00:26<00:52, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9389, LAS: 0.8896, UEM: 0.5482, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9369, partial_loss/deprel_loss: 0.8963, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0805, loss: 0.7991, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 36%|###6 | 40/111 [00:28<00:51, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9398, LAS: 0.8907, UEM: 0.5574, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2348, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5227, loss: 0.7898, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 39%|###8 | 43/111 [00:30<00:49, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9402, LAS: 0.8911, UEM: 0.5758, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0961, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4377, loss: 0.7841, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 41%|####1 | 46/111 [00:33<00:48, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9412, LAS: 0.8924, UEM: 0.5791, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.7733, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||: 44%|####4 | 49/111 [00:35<00:48, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9405, LAS: 0.8913, UEM: 0.5642, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9953, partial_loss/deprel_loss: 0.8299, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0390, loss: 0.7814, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 48%|####7 | 53/111 [00:38<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9404, LAS: 0.8914, UEM: 0.5579, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3034, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6113, loss: 0.7792, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 51%|#####1 | 57/111 [00:40<00:37, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9410, LAS: 0.8922, UEM: 0.5655, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.7743, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 54%|#####4 | 60/111 [00:42<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8935, UEM: 0.5793, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4151, partial_loss/deprel_loss: 0.4695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6346, loss: 0.7633, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 57%|#####6 | 63/111 [00:45<00:35, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9420, LAS: 0.8940, UEM: 0.6043, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0402, partial_loss/deprel_loss: 0.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2840, loss: 0.7604, batch_reg_loss: 0.1760, 
reg_loss: 0.1761 ||: 59%|#####9 | 66/111 [00:47<00:34, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9424, LAS: 0.8945, UEM: 0.6072, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8798, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9271, loss: 0.7567, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 62%|######2 | 69/111 [00:50<00:32, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9417, LAS: 0.8937, UEM: 0.5964, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9134, partial_loss/deprel_loss: 0.6988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9177, loss: 0.7623, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 66%|######5 | 73/111 [00:52<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9425, LAS: 0.8946, UEM: 0.6038, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8754, partial_loss/deprel_loss: 0.7352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9392, loss: 0.7569, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 69%|######9 | 77/111 [00:57<00:30, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9430, LAS: 0.8949, UEM: 0.6048, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2401, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.7545, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||: 72%|#######2 | 80/111 [01:00<00:26, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8322, UAS: 0.9423, LAS: 0.8940, UEM: 0.6014, LEM: 
0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3299, partial_loss/deprel_loss: 1.0192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2573, loss: 0.7618, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||: 75%|#######4 | 83/111 [01:02<00:22, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9428, LAS: 0.8945, UEM: 0.6022, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8188, partial_loss/deprel_loss: 0.7814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9648, loss: 0.7589, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||: 78%|#######8 | 87/111 [01:04<00:18, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9432, LAS: 0.8950, UEM: 0.6033, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4792, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.7550, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||: 81%|########1 | 90/111 [01:06<00:15, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9432, LAS: 0.8948, UEM: 0.5973, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7809, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0012, loss: 0.7570, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 85%|########4 | 94/111 [01:09<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9430, LAS: 0.8947, UEM: 0.5933, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0805, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9900, loss: 0.7587, batch_reg_loss: 
0.1759, reg_loss: 0.1760 ||: 87%|########7 | 97/111 [01:11<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9429, LAS: 0.8944, UEM: 0.5915, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6612, partial_loss/deprel_loss: 0.7524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9101, loss: 0.7615, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 91%|######### | 101/111 [01:14<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9425, LAS: 0.8939, UEM: 0.5845, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2449, partial_loss/deprel_loss: 0.8082, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0714, loss: 0.7650, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 95%|#########4| 105/111 [01:16<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9423, LAS: 0.8940, UEM: 0.5795, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6016, loss: 0.7645, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 98%|#########8| 109/111 [01:18<00:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9422, LAS: 0.8938, UEM: 0.5751, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6651, partial_loss/deprel_loss: 0.6879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8592, loss: 0.7658, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 100%|##########| 111/111 [01:20<00:00, 1.39it/s]\n", + "2023-04-07 00:16:58,127 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9622, LAS: 0.9118, UEM: 0.7073, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 24.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5125, loss: 18.2181, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9523, LAS: 0.9049, UEM: 0.7137, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2693, partial_loss/deprel_loss: 48.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 38.9773, loss: 22.4714, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9472, LAS: 0.8970, UEM: 0.6454, LEM: 0.3894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 43.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9260, loss: 24.5970, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.02it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9499, LAS: 0.8993, UEM: 0.6645, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4265, partial_loss/deprel_loss: 24.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7356, loss: 24.1319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9448, LAS: 0.8937, UEM: 0.6475, LEM: 0.3805, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6012, partial_loss/deprel_loss: 57.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 46.4244, loss: 25.8467, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.01it/s]\n", + "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.688 | 57.630\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.665 | 1.601\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - reg_loss | 0.176 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UEM | 0.575 | 0.648\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LAS | 0.894 | 0.894\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - loss | 0.766 | 25.847\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer 
- LEM | 0.343 | 0.381\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | 0.945\n", + "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - EM | 0.883 | 0.827\n", + "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:17:10,958 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:17:15,921 - INFO - combo.training.trainer - Epoch duration: 0:01:41.052355\n", + "2023-04-07 00:17:15,922 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:41\n", + "2023-04-07 00:17:15,928 - INFO - allennlp.training.trainer - Epoch 66/399\n", + "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:17:15,938 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9503, LAS: 0.9045, UEM: 0.6977, LEM: 0.5070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1065, partial_loss/deprel_loss: 0.2698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4130, loss: 0.6921, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||: 3%|2 | 3/111 [00:02<01:20, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9330, LAS: 0.8820, UEM: 0.5288, LEM: 0.3498, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8724, partial_loss/deprel_loss: 0.7974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 0.8708, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||: 6%|6 | 7/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9319, LAS: 0.8828, UEM: 0.4824, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5042, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8339, loss: 0.8558, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||: 10%|9 | 11/111 [00:07<01:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9382, LAS: 0.8904, UEM: 0.5645, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.7947, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||: 13%|#2 | 14/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8779, UAS: 0.9392, LAS: 0.8913, UEM: 0.5810, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7095, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9165, loss: 0.7856, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||: 15%|#5 | 17/111 [00:11<01:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9393, LAS: 0.8918, UEM: 0.5778, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2544, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.7788, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 18%|#8 | 20/111 [00:13<01:06, 
1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9420, LAS: 0.8949, UEM: 0.5900, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2620, partial_loss/deprel_loss: 0.4336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5751, loss: 0.7566, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 21%|## | 23/111 [00:16<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9413, LAS: 0.8942, UEM: 0.5750, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.7582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.7636, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 23%|##3 | 26/111 [00:18<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9425, LAS: 0.8950, UEM: 0.5722, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6922, partial_loss/deprel_loss: 0.7588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9213, loss: 0.7595, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 26%|##6 | 29/111 [00:20<00:58, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9426, LAS: 0.8947, UEM: 0.5539, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.7658, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 30%|##9 | 33/111 [00:22<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9409, LAS: 0.8928, UEM: 0.5364, LEM: 
0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2077, partial_loss/deprel_loss: 0.7697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0331, loss: 0.7801, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 32%|###2 | 36/111 [00:25<00:53, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9417, LAS: 0.8936, UEM: 0.5383, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6008, partial_loss/deprel_loss: 0.6349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8038, loss: 0.7737, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 35%|###5 | 39/111 [00:27<00:50, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9419, LAS: 0.8937, UEM: 0.5330, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7104, partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8568, loss: 0.7698, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 39%|###8 | 43/111 [00:30<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9435, LAS: 0.8958, UEM: 0.5762, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.7536, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||: 41%|####1 | 46/111 [00:32<00:49, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9450, LAS: 0.8975, UEM: 0.6032, LEM: 0.3863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 0.7388, batch_reg_loss: 0.1758, reg_loss: 
0.1758 ||: 44%|####4 | 49/111 [00:35<00:50, 1.22it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9446, LAS: 0.8970, UEM: 0.5923, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5940, partial_loss/deprel_loss: 0.6613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.7427, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 47%|####6 | 52/111 [00:37<00:46, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8753, UAS: 0.9449, LAS: 0.8972, UEM: 0.5905, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9129, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9636, loss: 0.7413, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 50%|##### | 56/111 [00:40<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9460, LAS: 0.8985, UEM: 0.6008, LEM: 0.3761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.7311, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 53%|#####3 | 59/111 [00:42<00:38, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9449, LAS: 0.8970, UEM: 0.5994, LEM: 0.3741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9877, partial_loss/deprel_loss: 0.8369, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0427, loss: 0.7406, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 56%|#####5 | 62/111 [00:44<00:36, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9420, LAS: 0.8940, UEM: 0.5910, LEM: 0.3686, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7323, partial_loss/deprel_loss: 0.9653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2944, loss: 0.7644, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 59%|#####8 | 65/111 [00:46<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9423, LAS: 0.8944, UEM: 0.5933, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.3056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4558, loss: 0.7605, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 61%|######1 | 68/111 [00:49<00:31, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9416, LAS: 0.8937, UEM: 0.5844, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5059, partial_loss/deprel_loss: 0.5656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.7655, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 65%|######4 | 72/111 [00:51<00:27, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9416, LAS: 0.8939, UEM: 0.5826, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8336, partial_loss/deprel_loss: 0.6601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8705, loss: 0.7631, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 68%|######7 | 75/111 [00:53<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9426, LAS: 0.8951, UEM: 0.5931, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.7539, batch_reg_loss: 0.1757, reg_loss: 0.1758 
||: 70%|####### | 78/111 [00:56<00:24, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9429, LAS: 0.8955, UEM: 0.5893, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6002, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.7525, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||: 74%|#######3 | 82/111 [00:58<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9429, LAS: 0.8955, UEM: 0.5864, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3258, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.7537, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||: 77%|#######6 | 85/111 [01:00<00:18, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9425, LAS: 0.8951, UEM: 0.5812, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7507, partial_loss/deprel_loss: 0.7151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8979, loss: 0.7580, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||: 79%|#######9 | 88/111 [01:02<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9421, LAS: 0.8945, UEM: 0.5720, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8087, loss: 0.7620, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||: 83%|########2 | 92/111 [01:05<00:13, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9215, UAS: 0.9420, LAS: 0.8944, UEM: 0.5703, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.7642, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||: 86%|########5 | 95/111 [01:07<00:11, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8944, UEM: 0.5656, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.7654, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 88%|########8 | 98/111 [01:09<00:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9425, LAS: 0.8950, UEM: 0.5688, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.7615, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 91%|######### | 101/111 [01:12<00:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8398, UAS: 0.9421, LAS: 0.8945, UEM: 0.5678, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2186, partial_loss/deprel_loss: 0.9452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.7646, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 95%|#########4| 105/111 [01:14<00:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9422, LAS: 0.8945, UEM: 0.5710, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1337, partial_loss/deprel_loss: 0.8690, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0975, loss: 0.7643, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 97%|#########7| 108/111 [01:16<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9424, LAS: 0.8947, UEM: 0.5696, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4207, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.7623, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 100%|##########| 111/111 [01:18<00:00, 1.41it/s]\n", + "2023-04-07 00:18:37,817 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.538 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.421 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - reg_loss | 0.176 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UEM | 0.570 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - 
LAS | 0.895 | N/A\n", + "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - loss | 0.762 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEM | 0.341 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - UAS | 0.942 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EM | 0.905 | N/A\n", + "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:18:37,824 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Epoch duration: 0:01:27.828285\n", + "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:02\n", + "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Epoch 67/399\n", + "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:18:43,757 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:18:43,764 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9642, LAS: 0.9136, UEM: 0.7103, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4133, partial_loss/deprel_loss: 0.5074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.5930, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||: 3%|2 | 3/111 [00:02<01:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9569, LAS: 0.9091, UEM: 0.6867, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8104, partial_loss/deprel_loss: 0.7143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.6318, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||: 5%|5 | 6/111 [00:04<01:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9488, LAS: 0.9010, UEM: 0.6200, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.7593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9463, loss: 0.6963, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||: 8%|8 | 9/111 [00:06<01:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9508, LAS: 0.9041, UEM: 0.6444, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5798, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6720, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||: 11%|# | 12/111 [00:08<01:12, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9467, LAS: 0.8998, UEM: 0.6254, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4919, partial_loss/deprel_loss: 0.8657, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1665, loss: 0.7057, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||: 14%|#3 | 15/111 [00:10<01:10, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9469, LAS: 0.8998, UEM: 0.6047, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5035, partial_loss/deprel_loss: 0.5987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7078, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||: 16%|#6 | 18/111 [00:12<01:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9442, LAS: 0.8963, UEM: 0.5739, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7310, partial_loss/deprel_loss: 0.7217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8991, loss: 0.7291, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 20%|#9 | 22/111 [00:15<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9430, LAS: 0.8945, UEM: 0.5612, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6500, loss: 0.7442, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 23%|##3 | 26/111 [00:18<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9418, LAS: 0.8931, UEM: 0.5430, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.7788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.7568, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 26%|##6 | 29/111 [00:20<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9410, LAS: 0.8926, UEM: 0.5419, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.7624, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 29%|##8 | 32/111 [00:22<00:54, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9414, LAS: 0.8931, UEM: 0.5294, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.7629, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 32%|###2 | 36/111 [00:24<00:50, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9408, LAS: 0.8920, UEM: 0.5319, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2387, partial_loss/deprel_loss: 0.4094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.7721, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 35%|###5 | 39/111 [00:27<00:50, 1.43it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9387, LAS: 0.8896, UEM: 0.5138, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7333, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9378, loss: 0.7934, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 39%|###8 | 43/111 [00:29<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9402, LAS: 0.8909, UEM: 0.5172, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4004, partial_loss/deprel_loss: 0.5476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6936, loss: 0.7838, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 42%|####2 | 47/111 [00:32<00:41, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9420, LAS: 0.8928, UEM: 0.5398, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6228, loss: 0.7686, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 46%|####5 | 51/111 [00:34<00:40, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8131, UAS: 0.9405, LAS: 0.8912, UEM: 0.5303, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9220, partial_loss/deprel_loss: 1.1761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5007, loss: 0.7840, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 49%|####8 | 54/111 [00:37<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9656, UAS: 0.9420, LAS: 0.8931, UEM: 0.5650, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.0461, partial_loss/deprel_loss: 0.1304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2890, loss: 0.7724, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 51%|#####1 | 57/111 [00:39<00:40, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9416, LAS: 0.8928, UEM: 0.5562, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.6746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.7761, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 55%|#####4 | 61/111 [00:42<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9413, LAS: 0.8928, UEM: 0.5574, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.7247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9168, loss: 0.7787, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 58%|#####7 | 64/111 [00:44<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9412, LAS: 0.8928, UEM: 0.5553, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2988, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5880, loss: 0.7789, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||: 61%|######1 | 68/111 [00:46<00:29, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9407, LAS: 0.8924, UEM: 0.5512, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7505, loss: 0.7839, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 65%|######4 | 72/111 [00:49<00:26, 1.47it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9412, LAS: 0.8931, UEM: 0.5510, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.7792, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 68%|######8 | 76/111 [00:51<00:22, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9425, LAS: 0.8948, UEM: 0.5767, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4055, loss: 0.7664, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 72%|#######2 | 80/111 [00:54<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9419, LAS: 0.8942, UEM: 0.5766, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3649, partial_loss/deprel_loss: 0.9268, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1898, loss: 0.7712, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 76%|#######5 | 84/111 [00:57<00:18, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9419, LAS: 0.8943, UEM: 0.5731, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8962, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9527, loss: 0.7723, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 79%|#######9 | 88/111 [01:00<00:15, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9417, LAS: 0.8942, UEM: 0.5688, LEM: 0.3422, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0678, partial_loss/deprel_loss: 0.7556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9934, loss: 0.7736, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 83%|########2 | 92/111 [01:02<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9423, LAS: 0.8947, UEM: 0.5730, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3825, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.7677, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 86%|########5 | 95/111 [01:05<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9423, LAS: 0.8947, UEM: 0.5699, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6675, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8590, loss: 0.7672, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 88%|########8 | 98/111 [01:07<00:09, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9425, LAS: 0.8949, UEM: 0.5694, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7032, loss: 0.7656, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 91%|######### | 101/111 [01:09<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9427, LAS: 0.8950, UEM: 0.5679, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8124, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9671, loss: 0.7648, batch_reg_loss: 0.1754, 
reg_loss: 0.1755 ||: 94%|#########3| 104/111 [01:12<00:05, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9427, LAS: 0.8950, UEM: 0.5721, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1232, partial_loss/deprel_loss: 0.8301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0640, loss: 0.7638, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||: 96%|#########6| 107/111 [01:14<00:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - ELAS | 
0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.533 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.443 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - reg_loss | 0.175 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UEM | 0.571 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LAS | 0.895 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - loss | 0.762 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEM | 0.339 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UAS | 0.943 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EM | 0.898 | N/A\n", + "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:20:03,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Epoch duration: 0:01:24.945331\n", + "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Estimated training time remaining: 7:21:09\n", + "2023-04-07 00:20:08,702 - INFO - allennlp.training.trainer - Epoch 68/399\n", + "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:20:08,712 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9535, LAS: 0.9120, UEM: 0.6017, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5809, loss: 0.6322, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 4%|3 | 4/111 [00:02<01:05, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9387, LAS: 0.8935, UEM: 0.5898, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9282, partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4375, loss: 0.7649, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 7%|7 | 8/111 [00:05<01:05, 1.57it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9419, LAS: 0.8966, UEM: 0.6199, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1184, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4087, loss: 0.7419, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 10%|9 | 11/111 
[00:07<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9371, LAS: 0.8921, UEM: 0.6124, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 0.7199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.7698, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 13%|#2 | 14/111 [00:09<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9398, LAS: 0.8943, UEM: 0.5887, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6932, partial_loss/deprel_loss: 0.7136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 0.7637, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 16%|#6 | 18/111 [00:11<01:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9373, LAS: 0.8906, UEM: 0.5553, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4083, partial_loss/deprel_loss: 0.5014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6580, loss: 0.7922, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 20%|#9 | 22/111 [00:14<00:57, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9363, LAS: 0.8891, UEM: 0.5288, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6937, partial_loss/deprel_loss: 0.7187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8890, loss: 0.8091, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 23%|##3 | 26/111 [00:16<00:52, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9373, LAS: 0.8901, UEM: 0.5235, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3720, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.7941, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 27%|##7 | 30/111 [00:19<00:50, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9370, LAS: 0.8900, UEM: 0.5187, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1057, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9801, loss: 0.7943, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 31%|### | 34/111 [00:21<00:46, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9386, LAS: 0.8917, UEM: 0.5275, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2765, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.7792, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||: 34%|###4 | 38/111 [00:24<00:45, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9375, LAS: 0.8906, UEM: 0.5236, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.7878, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 38%|###7 | 42/111 [00:26<00:44, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9376, LAS: 0.8906, UEM: 0.5201, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.5141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.7886, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 41%|####1 | 46/111 [00:30<00:44, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9371, LAS: 0.8898, UEM: 0.5100, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8646, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9233, loss: 0.7953, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 45%|####5 | 50/111 [00:32<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9379, LAS: 0.8905, UEM: 0.5044, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.7904, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 49%|####8 | 54/111 [00:35<00:37, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9390, LAS: 0.8916, UEM: 0.5100, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8865, loss: 0.7837, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 52%|#####2 | 58/111 [00:37<00:34, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9404, LAS: 0.8931, UEM: 0.5284, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.3919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.7733, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 56%|#####5 | 62/111 [00:40<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9407, LAS: 0.8932, UEM: 0.5270, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9076, partial_loss/deprel_loss: 0.7910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7728, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 59%|#####8 | 65/111 [00:42<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9411, LAS: 0.8936, UEM: 0.5325, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7607, partial_loss/deprel_loss: 0.6914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.7690, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 61%|######1 | 68/111 [00:45<00:31, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9413, LAS: 0.8941, UEM: 0.5542, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8555, partial_loss/deprel_loss: 0.7473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.7660, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 64%|######3 | 71/111 [00:47<00:30, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9424, LAS: 0.8953, UEM: 0.5672, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2020, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5146, loss: 0.7573, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 67%|######6 | 74/111 [00:49<00:27, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9429, LAS: 0.8959, UEM: 0.5668, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3585, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.7541, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||: 69%|######9 | 77/111 [00:52<00:25, 
1.33it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9430, LAS: 0.8959, UEM: 0.5699, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3904, partial_loss/deprel_loss: 0.5182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.7540, batch_reg_loss: 0.1752, reg_loss: 0.1752 ||: 72%|#######2 | 80/111 [00:54<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9431, LAS: 0.8959, UEM: 0.5689, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7975, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.7528, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 76%|#######5 | 84/111 [00:57<00:19, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9435, LAS: 0.8963, UEM: 0.5747, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7502, loss: 0.7493, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 78%|#######8 | 87/111 [00:59<00:17, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9434, LAS: 0.8962, UEM: 0.5679, LEM: 0.3372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.7515, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 82%|########1 | 91/111 [01:01<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9430, LAS: 
0.8956, UEM: 0.5675, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3792, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7560, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 86%|########5 | 95/111 [01:04<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9425, LAS: 0.8951, UEM: 0.5604, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6581, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.7601, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 88%|########8 | 98/111 [01:06<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9430, LAS: 0.8956, UEM: 0.5657, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2269, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.7555, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 91%|######### | 101/111 [01:09<00:07, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9434, LAS: 0.8958, UEM: 0.5635, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.6125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7372, loss: 0.7544, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 94%|#########3| 104/111 [01:11<00:05, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9443, LAS: 0.8970, UEM: 0.5796, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1041, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3744, 
loss: 0.7458, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 97%|#########7| 108/111 [01:14<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9443, LAS: 0.8969, UEM: 0.5791, LEM: 0.3471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1234, partial_loss/deprel_loss: 0.8039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0429, loss: 0.7461, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.804 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.123 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - reg_loss | 0.175 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UEM | 0.579 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LAS | 0.897 | N/A\n", + "2023-04-07 00:21:27,339 - 
INFO - combo.training.tensorboard_writer - loss | 0.746 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEM | 0.347 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UAS | 0.944 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EM | 0.867 | N/A\n", + "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:21:27,343 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Epoch duration: 0:01:22.876591\n", + "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:04\n", + "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Epoch 69/399\n", + "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:21:31,588 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9372, LAS: 0.8856, UEM: 0.3389, LEM: 0.1217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6342, loss: 0.8309, batch_reg_loss: 0.1751, reg_loss: 0.1751 
||: 4%|3 | 4/111 [00:02<01:07, 1.59it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9488, LAS: 0.9004, UEM: 0.5510, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.7200, batch_reg_loss: 0.1750, reg_loss: 0.1751 ||: 7%|7 | 8/111 [00:04<01:02, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9457, LAS: 0.8972, UEM: 0.5200, LEM: 0.2623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4084, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6509, loss: 0.7452, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 11%|# | 12/111 [00:07<01:01, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9434, LAS: 0.8948, UEM: 0.5249, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9379, partial_loss/deprel_loss: 0.8857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0712, loss: 0.7653, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 14%|#3 | 15/111 [00:09<01:02, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9402, LAS: 0.8918, UEM: 0.5390, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.7944, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 16%|#6 | 18/111 [00:11<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9430, LAS: 
0.8945, UEM: 0.5717, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.7723, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 19%|#8 | 21/111 [00:14<01:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9404, LAS: 0.8918, UEM: 0.5454, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2247, partial_loss/deprel_loss: 0.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1205, loss: 0.7921, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 22%|##1 | 24/111 [00:16<01:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9382, LAS: 0.8897, UEM: 0.5276, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6034, partial_loss/deprel_loss: 0.8647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1875, loss: 0.8006, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 24%|##4 | 27/111 [00:18<00:58, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9380, LAS: 0.8899, UEM: 0.5353, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2211, partial_loss/deprel_loss: 0.3530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5016, loss: 0.8007, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 27%|##7 | 30/111 [00:20<00:59, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9380, LAS: 0.8903, UEM: 0.5375, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.7981, batch_reg_loss: 
0.1750, reg_loss: 0.1750 ||: 30%|##9 | 33/111 [00:22<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9395, LAS: 0.8919, UEM: 0.5439, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.7799, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 33%|###3 | 37/111 [00:25<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9400, LAS: 0.8925, UEM: 0.5530, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6196, loss: 0.7748, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 37%|###6 | 41/111 [00:28<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9632, UAS: 0.9408, LAS: 0.8937, UEM: 0.5844, LEM: 0.3672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0568, partial_loss/deprel_loss: 0.1404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2986, loss: 0.7665, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 40%|###9 | 44/111 [00:30<00:49, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9411, LAS: 0.8936, UEM: 0.5783, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2504, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.7676, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 42%|####2 | 47/111 [00:32<00:45, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9419, LAS: 0.8945, UEM: 0.5785, LEM: 0.3548, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8914, loss: 0.7608, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||: 46%|####5 | 51/111 [00:35<00:41, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9407, LAS: 0.8931, UEM: 0.5619, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9799, loss: 0.7714, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 50%|####9 | 55/111 [00:37<00:38, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9407, LAS: 0.8932, UEM: 0.5584, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5583, partial_loss/deprel_loss: 0.5483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7253, loss: 0.7697, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 53%|#####3 | 59/111 [00:40<00:34, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9405, LAS: 0.8928, UEM: 0.5496, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7194, partial_loss/deprel_loss: 0.7566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.7737, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 57%|#####6 | 63/111 [00:43<00:31, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9410, LAS: 0.8932, UEM: 0.5453, LEM: 0.3202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4204, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6801, loss: 0.7715, batch_reg_loss: 0.1749, reg_loss: 0.1750 
||: 60%|###### | 67/111 [00:45<00:27, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9418, LAS: 0.8937, UEM: 0.5471, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3232, partial_loss/deprel_loss: 0.4991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6388, loss: 0.7663, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 64%|######3 | 71/111 [00:48<00:26, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9413, LAS: 0.8930, UEM: 0.5375, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7553, partial_loss/deprel_loss: 0.7453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9222, loss: 0.7724, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 68%|######7 | 75/111 [00:51<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9418, LAS: 0.8934, UEM: 0.5385, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5953, partial_loss/deprel_loss: 0.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8388, loss: 0.7695, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 70%|####### | 78/111 [00:53<00:24, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9427, LAS: 0.8946, UEM: 0.5573, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.7609, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 73%|#######2 | 81/111 [00:55<00:21, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.8745, UAS: 0.9429, LAS: 0.8948, UEM: 0.5602, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8755, partial_loss/deprel_loss: 0.6715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8872, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 76%|#######5 | 84/111 [00:58<00:19, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9429, LAS: 0.8950, UEM: 0.5685, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2962, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||: 78%|#######8 | 87/111 [01:00<00:17, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9437, LAS: 0.8959, UEM: 0.5770, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2044, partial_loss/deprel_loss: 0.3830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.7520, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||: 82%|########1 | 91/111 [01:02<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9440, LAS: 0.8962, UEM: 0.5740, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4221, partial_loss/deprel_loss: 0.4896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6510, loss: 0.7511, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||: 85%|########4 | 94/111 [01:05<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9435, LAS: 0.8957, UEM: 0.5720, LEM: 0.3396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.4080, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.5656, loss: 0.7546, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 88%|########8 | 98/111 [01:07<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9435, LAS: 0.8959, UEM: 0.5687, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9934, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9634, loss: 0.7537, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 92%|#########1| 102/111 [01:10<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9441, LAS: 0.8966, UEM: 0.5770, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1999, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7478, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 95%|#########4| 105/111 [01:13<00:04, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9441, LAS: 0.8966, UEM: 0.5723, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.7484, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 98%|#########8| 109/111 [01:15<00:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9445, LAS: 0.8970, UEM: 0.5766, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2103, partial_loss/deprel_loss: 0.3635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.7455, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 100%|##########| 111/111 [01:16<00:00, 1.44it/s]\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - 
Training | Validation\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.363 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.210 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - reg_loss | 0.175 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UEM | 0.577 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LAS | 0.897 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - loss | 0.746 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEM | 0.341 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UAS | 0.945 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - 
FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EM | 0.925 | N/A\n", + "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:22:51,434 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Epoch duration: 0:01:24.403512\n", + "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:06\n", + "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Epoch 70/399\n", + "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:22:55,993 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9506, LAS: 0.9042, UEM: 0.5290, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6881, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6847, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||: 3%|2 | 3/111 [00:02<01:22, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9477, LAS: 0.8997, UEM: 0.5508, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.4398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7136, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||: 6%|6 | 7/111 [00:04<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9454, LAS: 0.8973, UEM: 0.5153, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8429, partial_loss/deprel_loss: 0.8392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0147, loss: 0.7399, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||: 10%|9 | 11/111 [00:07<01:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9452, LAS: 0.8978, UEM: 0.5334, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7221, loss: 0.7331, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||: 13%|#2 | 14/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9460, LAS: 0.8982, UEM: 0.5915, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1596, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0851, loss: 0.7203, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||: 16%|#6 | 18/111 [00:12<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9457, LAS: 0.8980, UEM: 0.5696, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4944, partial_loss/deprel_loss: 0.6857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8221, loss: 0.7229, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 20%|#9 | 22/111 [00:14<00:58, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9450, LAS: 0.8981, UEM: 0.5822, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1255, partial_loss/deprel_loss: 0.2653, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4120, loss: 0.7276, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 23%|##3 | 26/111 [00:17<00:55, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9464, LAS: 0.8994, UEM: 0.6001, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1067, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.7160, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 27%|##7 | 30/111 [00:19<00:52, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9470, LAS: 0.9001, UEM: 0.6030, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7936, partial_loss/deprel_loss: 0.7543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9368, loss: 0.7124, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 30%|##9 | 33/111 [00:21<00:51, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9472, LAS: 0.9003, UEM: 0.6065, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7396, loss: 0.7110, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 32%|###2 | 36/111 [00:24<00:52, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9483, LAS: 0.9017, UEM: 0.6156, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.7037, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 35%|###5 | 39/111 [00:26<00:50, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 
0.9464, LAS: 0.8989, UEM: 0.5964, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5875, partial_loss/deprel_loss: 0.6289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7953, loss: 0.7232, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||: 39%|###8 | 43/111 [00:28<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9463, LAS: 0.8987, UEM: 0.5899, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8414, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8850, loss: 0.7244, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 41%|####1 | 46/111 [00:31<00:46, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9472, LAS: 0.8996, UEM: 0.5881, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.7186, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 45%|####5 | 50/111 [00:33<00:41, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9467, LAS: 0.8991, UEM: 0.5861, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.3734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.7234, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 49%|####8 | 54/111 [00:36<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9450, LAS: 0.8975, UEM: 0.5755, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5630, partial_loss/deprel_loss: 0.6081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7737, loss: 
0.7364, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 51%|#####1 | 57/111 [00:38<00:37, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9450, LAS: 0.8976, UEM: 0.5710, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2503, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7372, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 55%|#####4 | 61/111 [00:41<00:34, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9442, LAS: 0.8967, UEM: 0.5627, LEM: 0.3232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9444, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0059, loss: 0.7428, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 59%|#####8 | 65/111 [00:43<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9451, LAS: 0.8978, UEM: 0.5759, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3515, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7330, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 62%|######2 | 69/111 [00:46<00:28, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9447, LAS: 0.8976, UEM: 0.5749, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3702, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.7347, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 66%|######5 | 73/111 [00:49<00:26, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9453, LAS: 0.8984, UEM: 0.5932, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6705, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.7296, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 68%|######8 | 76/111 [00:52<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9456, LAS: 0.8986, UEM: 0.5912, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3765, partial_loss/deprel_loss: 0.5242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7272, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 71%|#######1 | 79/111 [00:54<00:23, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9456, LAS: 0.8988, UEM: 0.5885, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.7257, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||: 74%|#######3 | 82/111 [00:56<00:21, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9458, LAS: 0.8988, UEM: 0.5861, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.5251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6812, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||: 77%|#######6 | 85/111 [00:58<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.8990, UEM: 0.5836, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, 
partial_loss/deprel_loss: 0.6249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8081, loss: 0.7242, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||: 79%|#######9 | 88/111 [01:00<00:16, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9462, LAS: 0.8994, UEM: 0.5841, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3782, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6918, loss: 0.7221, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 83%|########2 | 92/111 [01:03<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9457, LAS: 0.8989, UEM: 0.5914, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1358, partial_loss/deprel_loss: 0.2361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3906, loss: 0.7262, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 86%|########5 | 95/111 [01:05<00:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9459, LAS: 0.8990, UEM: 0.5926, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2622, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 89%|########9 | 99/111 [01:08<00:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9452, LAS: 0.8983, UEM: 0.5850, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6349, partial_loss/deprel_loss: 0.5700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7305, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 93%|#########2| 103/111 [01:10<00:05, 1.52it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9447, LAS: 0.8977, UEM: 0.5808, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9583, loss: 0.7356, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 96%|#########6| 107/111 [01:12<00:02, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-07 00:24:14,896 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9488, LAS: 0.8951, UEM: 0.5461, LEM: 0.2057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4334, partial_loss/deprel_loss: 24.7874, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9166, loss: 23.9872, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 
0.9478, LAS: 0.8936, UEM: 0.5263, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5667, partial_loss/deprel_loss: 24.3909, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6260, loss: 25.3352, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:07, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8277, UAS: 0.9436, LAS: 0.8916, UEM: 0.6500, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5601, partial_loss/deprel_loss: 57.8863, partial_loss/cycle_loss: 0.0000, batch_loss: 46.6211, loss: 27.1227, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:06<00:05, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9474, LAS: 0.8963, UEM: 0.6602, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 17.6734, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2133, loss: 25.4952, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:09<00:02, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 
24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.668 | 31.017\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.549 | 0.912\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - reg_loss | 0.175 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UEM | 0.577 | 0.652\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LAS | 0.898 | 0.896\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - loss | 0.738 | 26.020\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEM | 0.345 | 0.387\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - 
combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UAS | 0.944 | 0.947\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EM | 0.896 | 0.884\n", + "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:24:27,558 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Epoch duration: 0:01:36.532109\n", + "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:04\n", + "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Epoch 71/399\n", + "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:24:32,517 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:24:32,524 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9590, LAS: 0.9141, UEM: 0.6957, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1020, partial_loss/deprel_loss: 0.2615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4041, loss: 0.6331, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 4%|3 | 4/111 [00:02<01:12, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9402, LAS: 0.8957, UEM: 0.6073, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0627, partial_loss/deprel_loss: 
0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9193, loss: 0.7472, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 6%|6 | 7/111 [00:05<01:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9451, LAS: 0.9012, UEM: 0.5755, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.4493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.7071, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 10%|9 | 11/111 [00:07<01:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9442, LAS: 0.8999, UEM: 0.5837, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6201, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.7150, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 14%|#3 | 15/111 [00:10<01:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9411, LAS: 0.8963, UEM: 0.5649, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4521, partial_loss/deprel_loss: 0.5205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6813, loss: 0.7479, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 16%|#6 | 18/111 [00:12<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9401, LAS: 0.8946, UEM: 0.5597, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2594, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5830, loss: 0.7609, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 20%|#9 | 22/111 [00:15<01:01, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9421, LAS: 0.8969, UEM: 0.5898, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2663, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5626, loss: 0.7449, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 23%|##2 | 25/111 [00:17<01:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9435, LAS: 0.8984, UEM: 0.5941, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9035, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.7326, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||: 26%|##6 | 29/111 [00:19<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9435, LAS: 0.8980, UEM: 0.5835, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2197, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.7323, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 30%|##9 | 33/111 [00:22<00:51, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9419, LAS: 0.8962, UEM: 0.5642, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8650, partial_loss/deprel_loss: 0.7420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9410, loss: 0.7496, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 32%|###2 | 36/111 [00:24<00:50, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9417, LAS: 0.8960, UEM: 0.5526, LEM: 0.3200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4917, partial_loss/deprel_loss: 0.5471, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7104, loss: 0.7502, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 35%|###5 | 39/111 [00:26<00:49, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9422, LAS: 0.8962, UEM: 0.5459, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.4688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6291, loss: 0.7475, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 39%|###8 | 43/111 [00:28<00:45, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9426, LAS: 0.8967, UEM: 0.5581, LEM: 0.3228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7444, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 42%|####2 | 47/111 [00:32<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9429, LAS: 0.8970, UEM: 0.5574, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6908, partial_loss/deprel_loss: 0.6305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8170, loss: 0.7423, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 45%|####5 | 50/111 [00:34<00:44, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9442, LAS: 0.8986, UEM: 0.5893, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4181, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5620, loss: 0.7319, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||: 48%|####7 | 53/111 [00:37<00:44, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.8396, UAS: 0.9442, LAS: 0.8985, UEM: 0.5971, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2169, partial_loss/deprel_loss: 0.9480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1761, loss: 0.7328, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 51%|#####1 | 57/111 [00:39<00:39, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9446, LAS: 0.8990, UEM: 0.5982, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2724, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.7271, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 54%|#####4 | 60/111 [00:41<00:36, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9439, LAS: 0.8982, UEM: 0.5894, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8146, partial_loss/deprel_loss: 0.7395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9289, loss: 0.7332, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 58%|#####7 | 64/111 [00:44<00:32, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9441, LAS: 0.8983, UEM: 0.5906, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5781, loss: 0.7327, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 60%|###### | 67/111 [00:46<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9442, LAS: 0.8982, UEM: 0.5844, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, 
partial_loss/deprel_loss: 0.5362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6735, loss: 0.7346, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 64%|######3 | 71/111 [00:48<00:26, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9443, LAS: 0.8983, UEM: 0.5809, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4050, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6479, loss: 0.7343, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||: 68%|######7 | 75/111 [00:51<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9447, LAS: 0.8986, UEM: 0.5798, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4875, loss: 0.7322, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9449, LAS: 0.8989, UEM: 0.5804, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4958, loss: 0.7293, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9453, LAS: 0.8992, UEM: 0.5786, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2871, partial_loss/deprel_loss: 0.4169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7271, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 77%|#######7 | 86/111 [00:59<00:17, 1.44it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8387, UAS: 0.9448, LAS: 0.8986, UEM: 0.5749, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3576, partial_loss/deprel_loss: 0.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1788, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 80%|######## | 89/111 [01:01<00:15, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9453, LAS: 0.8991, UEM: 0.5820, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5433, loss: 0.7274, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 84%|########3 | 93/111 [01:04<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9457, LAS: 0.8996, UEM: 0.5859, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2463, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.7239, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 86%|########6 | 96/111 [01:06<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9452, LAS: 0.8989, UEM: 0.5788, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8455, partial_loss/deprel_loss: 0.7369, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.7287, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 89%|########9 | 99/111 [01:08<00:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9451, LAS: 0.8987, UEM: 0.5735, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4627, partial_loss/deprel_loss: 0.5341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6941, loss: 0.7290, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 93%|#########2| 103/111 [01:10<00:05, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9452, LAS: 0.8988, UEM: 0.5804, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5536, partial_loss/deprel_loss: 0.6417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 0.7292, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 95%|#########5| 106/111 [01:13<00:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9449, LAS: 0.8985, UEM: 0.5797, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 98%|#########8| 109/111 [01:15<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9453, LAS: 0.8989, UEM: 0.5821, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.4372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.7289, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-07 00:25:51,826 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - 
combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.437 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.246 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - reg_loss | 0.174 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UEM | 0.582 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LAS | 0.899 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - loss | 0.729 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LEM | 0.350 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - UAS | 0.945 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EM | 0.919 | N/A\n", + "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:25:51,833 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:25:58,450 - INFO - combo.training.trainer - Epoch duration: 0:01:25.934082\n", + "2023-04-07 00:25:58,451 - INFO - combo.training.trainer - Estimated training time remaining: 7:18:10\n", + "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Epoch 72/399\n", + "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:25:58,459 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9210, LAS: 0.8741, UEM: 0.1528, LEM: 0.0349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0325, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9467, loss: 0.9111, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||: 3%|2 | 3/111 [00:02<01:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9339, LAS: 0.8884, UEM: 0.3328, LEM: 0.1396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, partial_loss/deprel_loss: 0.4203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.8094, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||: 5%|5 | 6/111 [00:04<01:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9389, LAS: 0.8942, UEM: 0.3980, LEM: 0.1852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2779, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.7716, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||: 8%|8 | 9/111 
[00:06<01:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9455, LAS: 0.9005, UEM: 0.5356, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2017, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4774, loss: 0.7129, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||: 11%|# | 12/111 [00:08<01:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9476, LAS: 0.9035, UEM: 0.6410, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0145, partial_loss/deprel_loss: 0.7799, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0010, loss: 0.6982, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||: 14%|#3 | 15/111 [00:11<01:14, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9487, LAS: 0.9049, UEM: 0.6574, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 16%|#6 | 18/111 [00:13<01:09, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9461, LAS: 0.9020, UEM: 0.6318, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3470, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0679, loss: 0.7139, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 20%|#9 | 22/111 [00:16<01:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9479, LAS: 0.9035, UEM: 0.6285, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.5446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7286, loss: 0.6959, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 23%|##3 | 26/111 [00:18<00:59, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9480, LAS: 0.9035, UEM: 0.6255, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5938, loss: 0.6938, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 26%|##6 | 29/111 [00:21<00:59, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9482, LAS: 0.9034, UEM: 0.6138, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.6008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7702, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 30%|##9 | 33/111 [00:23<00:55, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9489, LAS: 0.9044, UEM: 0.6279, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.6839, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 32%|###2 | 36/111 [00:26<00:55, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9488, LAS: 0.9043, UEM: 0.6230, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.6844, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||: 36%|###6 | 40/111 [00:29<00:52, 1.36it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9484, LAS: 0.9035, UEM: 0.6086, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5742, partial_loss/deprel_loss: 0.5775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.6907, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 40%|###9 | 44/111 [00:31<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9482, LAS: 0.9033, UEM: 0.5955, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.6924, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 43%|####3 | 48/111 [00:33<00:41, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9474, LAS: 0.9021, UEM: 0.5940, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2345, partial_loss/deprel_loss: 0.8553, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1053, loss: 0.7012, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 47%|####6 | 52/111 [00:36<00:38, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9483, LAS: 0.9031, UEM: 0.6069, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.6941, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 50%|##### | 56/111 [00:39<00:36, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9483, LAS: 0.9028, UEM: 0.5992, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2925, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.6959, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 54%|#####4 | 60/111 [00:41<00:33, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9464, LAS: 0.9008, UEM: 0.5965, LEM: 0.3693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0754, partial_loss/deprel_loss: 0.7823, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0150, loss: 0.7112, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 58%|#####7 | 64/111 [00:44<00:31, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8076, UAS: 0.9458, LAS: 0.9003, UEM: 0.6044, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8518, partial_loss/deprel_loss: 1.1044, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4279, loss: 0.7156, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 61%|######1 | 68/111 [00:47<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9458, LAS: 0.9002, UEM: 0.6026, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8045, loss: 0.7183, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 64%|######3 | 71/111 [00:49<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9461, LAS: 0.9006, UEM: 0.6006, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3879, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.7152, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 
67%|######6 | 74/111 [00:52<00:26, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9453, LAS: 0.8996, UEM: 0.5901, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5763, partial_loss/deprel_loss: 0.6045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7729, loss: 0.7218, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 70%|####### | 78/111 [00:54<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9454, LAS: 0.8994, UEM: 0.5849, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.6924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8746, loss: 0.7226, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 74%|#######3 | 82/111 [00:56<00:19, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9455, LAS: 0.8995, UEM: 0.5842, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.6244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8165, loss: 0.7207, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 77%|#######7 | 86/111 [00:59<00:16, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9446, LAS: 0.8984, UEM: 0.5772, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0883, partial_loss/deprel_loss: 0.7811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.7292, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 81%|########1 | 90/111 [01:02<00:13, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9444, LAS: 0.8984, UEM: 0.5738, LEM: 0.3422, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.7309, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||: 85%|########4 | 94/111 [01:04<00:11, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9445, LAS: 0.8985, UEM: 0.5741, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8477, loss: 0.7307, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||: 88%|########8 | 98/111 [01:07<00:08, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9456, LAS: 0.8997, UEM: 0.5927, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0877, partial_loss/deprel_loss: 0.2313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.7215, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||: 92%|#########1| 102/111 [01:10<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9453, LAS: 0.8995, UEM: 0.5870, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6028, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7565, loss: 0.7237, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||: 95%|#########4| 105/111 [01:12<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9456, LAS: 0.8997, UEM: 0.5861, LEM: 0.3529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4799, partial_loss/deprel_loss: 0.5671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7237, loss: 0.7223, batch_reg_loss: 0.1741, 
reg_loss: 0.1741 ||: 97%|#########7| 108/111 [01:14<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:27:18,544 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.454 | N/A\n", + "2023-04-07 
00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.288 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - reg_loss | 0.174 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - LAS | 0.900 | N/A\n", + "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - loss | 0.722 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEM | 0.351 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - UAS | 0.946 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EM | 0.924 | N/A\n", + "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:27:18,552 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Epoch duration: 0:01:26.320285\n", + "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:18\n", + "2023-04-07 00:27:24,771 - INFO - allennlp.training.trainer - Epoch 73/399\n", + "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:27:24,779 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9532, LAS: 0.9077, UEM: 0.5342, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2385, partial_loss/deprel_loss: 0.4693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5971, loss: 0.6751, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 4%|3 | 4/111 [00:02<01:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9604, LAS: 0.9180, UEM: 0.7379, LEM: 0.5320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0522, partial_loss/deprel_loss: 0.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2945, loss: 0.5981, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 6%|6 | 7/111 [00:05<01:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9585, LAS: 0.9155, UEM: 0.6843, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3479, partial_loss/deprel_loss: 0.5002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6111, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 10%|9 | 11/111 
[00:07<01:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9587, LAS: 0.9153, UEM: 0.6754, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7673, loss: 0.6098, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 13%|#2 | 14/111 [00:10<01:09, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9597, LAS: 0.9163, UEM: 0.6823, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.6001, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 15%|#5 | 17/111 [00:12<01:09, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9560, LAS: 0.9106, UEM: 0.6453, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8720, partial_loss/deprel_loss: 0.6651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.6418, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 19%|#8 | 21/111 [00:15<01:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8644, UAS: 0.9553, LAS: 0.9103, UEM: 0.6530, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0246, partial_loss/deprel_loss: 0.8085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0257, loss: 0.6453, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||: 22%|##1 | 24/111 [00:17<01:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9540, LAS: 0.9098, UEM: 0.6519, LEM: 0.4187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5992, loss: 0.6471, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 24%|##4 | 27/111 [00:19<01:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9525, LAS: 0.9076, UEM: 0.6388, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9665, partial_loss/deprel_loss: 0.7185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9421, loss: 0.6611, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 28%|##7 | 31/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9514, LAS: 0.9063, UEM: 0.6255, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.7669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9932, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 31%|### | 34/111 [00:24<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9517, LAS: 0.9066, UEM: 0.6244, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.6727, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 33%|###3 | 37/111 [00:26<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9514, LAS: 0.9063, UEM: 0.6176, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5196, partial_loss/deprel_loss: 0.5613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 36%|###6 | 40/111 [00:28<00:49, 1.42it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9502, LAS: 0.9048, UEM: 0.6083, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0434, partial_loss/deprel_loss: 0.8135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0334, loss: 0.6860, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 40%|###9 | 44/111 [00:30<00:45, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9485, LAS: 0.9032, UEM: 0.5897, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9389, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 43%|####3 | 48/111 [00:33<00:41, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9485, LAS: 0.9034, UEM: 0.5817, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7179, partial_loss/deprel_loss: 0.6370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8271, loss: 0.7025, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 47%|####6 | 52/111 [00:35<00:37, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9486, LAS: 0.9035, UEM: 0.5822, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3235, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.7005, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 50%|##### | 56/111 [00:38<00:37, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9498, LAS: 0.9046, UEM: 0.6007, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6910, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 53%|#####3 | 59/111 [00:40<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9496, LAS: 0.9047, UEM: 0.6015, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.4418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6108, loss: 0.6893, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||: 56%|#####5 | 62/111 [00:43<00:34, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9491, LAS: 0.9041, UEM: 0.5914, LEM: 0.3569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6222, loss: 0.6939, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||: 59%|#####9 | 66/111 [00:45<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9480, LAS: 0.9030, UEM: 0.5828, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5705, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||: 63%|######3 | 70/111 [00:48<00:27, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9473, LAS: 0.9025, UEM: 0.5904, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8044, partial_loss/deprel_loss: 1.0041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3380, loss: 0.7049, batch_reg_loss: 
0.1739, reg_loss: 0.1739 ||: 67%|######6 | 74/111 [00:51<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9475, LAS: 0.9027, UEM: 0.5984, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5672, partial_loss/deprel_loss: 0.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7722, loss: 0.7044, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||: 69%|######9 | 77/111 [00:53<00:23, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9465, LAS: 0.9015, UEM: 0.5902, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6163, partial_loss/deprel_loss: 0.5954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7734, loss: 0.7126, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||: 72%|#######2 | 80/111 [00:55<00:22, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9460, LAS: 0.9007, UEM: 0.5845, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9029, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9899, loss: 0.7188, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 76%|#######5 | 84/111 [00:58<00:18, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9461, LAS: 0.9008, UEM: 0.5894, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0194, partial_loss/deprel_loss: 0.7513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.7168, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 79%|#######9 | 88/111 [01:00<00:15, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9464, LAS: 0.9011, UEM: 
0.5857, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6419, loss: 0.7150, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 82%|########1 | 91/111 [01:03<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9463, LAS: 0.9008, UEM: 0.5802, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7188, partial_loss/deprel_loss: 0.7382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7179, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 85%|########4 | 94/111 [01:05<00:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9464, LAS: 0.9009, UEM: 0.5844, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6178, loss: 0.7152, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 87%|########7 | 97/111 [01:07<00:10, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9463, LAS: 0.9008, UEM: 0.5848, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3774, partial_loss/deprel_loss: 0.5079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6556, loss: 0.7175, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 90%|######### | 100/111 [01:09<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9466, LAS: 0.9012, UEM: 0.5866, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2466, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7140, 
batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 94%|#########3| 104/111 [01:12<00:05, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9466, LAS: 0.9010, UEM: 0.5883, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2192, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.7151, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 96%|#########6| 107/111 [01:14<00:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00, 1.44it/s]\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.610 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.533 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - reg_loss | 0.174 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UEM | 0.584 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LAS | 0.901 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - loss | 0.715 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEM | 0.354 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UAS | 0.947 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EM | 0.894 | N/A\n", + "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:28:45,380 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:28:50,593 - INFO - combo.training.trainer - Epoch duration: 0:01:25.821825\n", + "2023-04-07 00:28:50,594 - INFO - combo.training.trainer - Estimated training time remaining: 7:16:22\n", + "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Epoch 74/399\n", + "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:28:50,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:28:50,602 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9457, LAS: 0.8979, UEM: 0.4358, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4698, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.7372, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 4%|3 | 4/111 [00:02<01:04, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8997, UEM: 0.4974, LEM: 0.2300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4275, partial_loss/deprel_loss: 0.6147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7511, loss: 0.7173, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 6%|6 | 7/111 [00:04<01:06, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9457, LAS: 0.8984, UEM: 0.4551, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5032, partial_loss/deprel_loss: 0.5335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7012, loss: 0.7334, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 10%|9 | 11/111 
[00:07<01:03, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9439, LAS: 0.8984, UEM: 0.4737, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5044, loss: 0.7341, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 13%|#2 | 14/111 [00:09<01:03, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9475, LAS: 0.9026, UEM: 0.5509, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4653, partial_loss/deprel_loss: 0.5485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.7058, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 16%|#6 | 18/111 [00:11<01:01, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9479, LAS: 0.9031, UEM: 0.5658, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1822, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.6988, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 20%|#9 | 22/111 [00:14<01:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9479, LAS: 0.9028, UEM: 0.5521, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5888, loss: 0.7014, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||: 23%|##2 | 25/111 [00:17<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9484, LAS: 0.9031, UEM: 0.5483, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3309, partial_loss/deprel_loss: 0.5004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.6986, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 25%|##5 | 28/111 [00:19<01:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9473, LAS: 0.9015, UEM: 0.5368, LEM: 0.3037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6838, partial_loss/deprel_loss: 0.6598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.7088, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 29%|##8 | 32/111 [00:21<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9485, LAS: 0.9027, UEM: 0.5627, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3361, partial_loss/deprel_loss: 0.4837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6279, loss: 0.7007, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 32%|###1 | 35/111 [00:24<00:53, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9499, LAS: 0.9039, UEM: 0.5790, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.4233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6914, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 34%|###4 | 38/111 [00:26<00:53, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8834, UAS: 0.9492, LAS: 0.9031, UEM: 0.5832, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.7277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8679, loss: 0.6963, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 37%|###6 | 41/111 [00:28<00:50, 1.38it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9482, LAS: 0.9020, UEM: 0.5690, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8162, partial_loss/deprel_loss: 0.7002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8971, loss: 0.7059, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 40%|###9 | 44/111 [00:30<00:48, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9478, LAS: 0.9018, UEM: 0.5640, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2325, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.7076, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||: 43%|####3 | 48/111 [00:33<00:42, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9472, LAS: 0.9016, UEM: 0.5642, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2649, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.7090, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 47%|####6 | 52/111 [00:35<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9473, LAS: 0.9019, UEM: 0.5663, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.7079, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 50%|####9 | 55/111 [00:37<00:38, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9480, LAS: 0.9025, UEM: 0.5654, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.7046, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 52%|#####2 | 58/111 [00:40<00:37, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9475, LAS: 0.9022, UEM: 0.5687, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.7055, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 56%|#####5 | 62/111 [00:42<00:34, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9476, LAS: 0.9025, UEM: 0.6012, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1395, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4871, loss: 0.7037, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 59%|#####8 | 65/111 [00:45<00:33, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9469, LAS: 0.9016, UEM: 0.5897, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7124, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||: 62%|######2 | 69/111 [00:47<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9468, LAS: 0.9016, UEM: 0.5911, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4491, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1418, loss: 0.7127, batch_reg_loss: 
0.1736, reg_loss: 0.1737 ||: 66%|######5 | 73/111 [00:50<00:26, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9465, LAS: 0.9013, UEM: 0.5840, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7986, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9283, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 68%|######8 | 76/111 [00:52<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9460, LAS: 0.9008, UEM: 0.5814, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.7194, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 72%|#######2 | 80/111 [00:55<00:20, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9465, LAS: 0.9011, UEM: 0.5803, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 76%|#######5 | 84/111 [00:57<00:18, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9453, LAS: 0.8998, UEM: 0.5735, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7406, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3691, loss: 0.7262, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 78%|#######8 | 87/111 [01:00<00:16, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9462, LAS: 0.9008, UEM: 
0.5816, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1876, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.7184, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 82%|########1 | 91/111 [01:02<00:13, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9458, LAS: 0.9004, UEM: 0.5796, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9515, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0319, loss: 0.7209, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 86%|########5 | 95/111 [01:05<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9462, LAS: 0.9009, UEM: 0.5865, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2142, partial_loss/deprel_loss: 0.3441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4918, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 88%|########8 | 98/111 [01:07<00:09, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9463, LAS: 0.9009, UEM: 0.5842, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3423, partial_loss/deprel_loss: 0.5043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6456, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 91%|######### | 101/111 [01:09<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9461, LAS: 0.9005, UEM: 0.5788, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9346, partial_loss/deprel_loss: 0.7656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.7180, 
batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 95%|#########4| 105/111 [01:12<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9465, LAS: 0.9009, UEM: 0.5816, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7137, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 98%|#########8| 109/111 [01:15<00:01, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9469, LAS: 0.9013, UEM: 0.5879, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4319, partial_loss/deprel_loss: 0.4654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.7106, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.465 | 
N/A\n", + "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.432 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - reg_loss | 0.174 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UEM | 0.588 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LAS | 0.901 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - loss | 0.711 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEM | 0.351 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UAS | 0.947 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EM | 0.912 | N/A\n", + "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:30:10,477 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Epoch duration: 0:01:25.020714\n", + "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:22\n", + "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Epoch 75/399\n", + "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:30:15,626 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9491, LAS: 0.9042, UEM: 0.4891, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6299, partial_loss/deprel_loss: 0.6336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.7056, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||: 4%|3 | 4/111 [00:02<01:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9499, LAS: 0.9071, UEM: 0.4945, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3865, partial_loss/deprel_loss: 0.4271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.6799, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||: 6%|6 | 7/111 [00:04<01:07, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9516, LAS: 0.9080, UEM: 0.5327, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4005, partial_loss/deprel_loss: 0.5567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6990, loss: 0.6671, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||: 9%|9 | 10/111 [00:06<01:06, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9507, LAS: 0.9067, UEM: 0.5098, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4433, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6896, loss: 0.6811, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||: 12%|#1 | 13/111 [00:08<01:05, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9465, LAS: 0.9025, UEM: 0.4974, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9581, partial_loss/deprel_loss: 0.7562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9701, loss: 0.7203, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 15%|#5 | 17/111 [00:11<01:02, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9489, LAS: 0.9046, UEM: 0.5301, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2274, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5794, loss: 0.6991, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 19%|#8 | 21/111 [00:14<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9478, LAS: 0.9035, UEM: 0.5397, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5845, partial_loss/deprel_loss: 0.5930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 0.7022, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 22%|##1 | 24/111 [00:16<00:58, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9468, LAS: 0.9015, UEM: 0.5314, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2592, partial_loss/deprel_loss: 
0.4407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7139, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 24%|##4 | 27/111 [00:18<00:58, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9464, LAS: 0.9007, UEM: 0.5205, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8469, partial_loss/deprel_loss: 0.7144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.7212, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 28%|##7 | 31/111 [00:20<00:54, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9458, LAS: 0.9003, UEM: 0.5028, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.5689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7708, loss: 0.7229, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 32%|###1 | 35/111 [00:23<00:49, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9465, LAS: 0.9008, UEM: 0.5095, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2651, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5487, loss: 0.7180, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 35%|###5 | 39/111 [00:25<00:46, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9450, LAS: 0.8992, UEM: 0.5146, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3986, partial_loss/deprel_loss: 0.8601, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.7268, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 39%|###8 | 43/111 [00:28<00:46, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9453, LAS: 0.8996, UEM: 0.5111, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7778, partial_loss/deprel_loss: 0.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8898, loss: 0.7258, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 42%|####2 | 47/111 [00:31<00:42, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9460, LAS: 0.9001, UEM: 0.5274, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.7209, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 45%|####5 | 50/111 [00:33<00:41, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9465, LAS: 0.9009, UEM: 0.5576, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4808, loss: 0.7148, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 48%|####7 | 53/111 [00:35<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9470, LAS: 0.9016, UEM: 0.5619, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4573, partial_loss/deprel_loss: 0.5106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6734, loss: 0.7086, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 50%|##### | 56/111 [00:38<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9478, LAS: 0.9026, UEM: 0.5709, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3034, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.7010, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||: 53%|#####3 | 59/111 [00:40<00:40, 1.29it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9478, LAS: 0.9028, UEM: 0.5694, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3711, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6245, loss: 0.6999, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 56%|#####5 | 62/111 [00:42<00:36, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9477, LAS: 0.9025, UEM: 0.5648, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9499, partial_loss/deprel_loss: 0.7206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9399, loss: 0.7035, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 59%|#####8 | 65/111 [00:44<00:33, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9478, LAS: 0.9026, UEM: 0.5617, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.7231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9010, loss: 0.7022, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 62%|######2 | 69/111 [00:47<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9464, LAS: 0.9012, UEM: 0.5578, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.7157, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 65%|######4 | 72/111 [00:49<00:27, 
1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9469, LAS: 0.9017, UEM: 0.5644, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5945, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7529, loss: 0.7114, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 68%|######7 | 75/111 [00:51<00:25, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9467, LAS: 0.9014, UEM: 0.5578, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6574, partial_loss/deprel_loss: 0.6179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 0.7137, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 71%|#######1 | 79/111 [00:54<00:21, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9470, LAS: 0.9017, UEM: 0.5695, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5613, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.7098, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9473, LAS: 0.9019, UEM: 0.5681, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3195, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.7095, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 78%|#######8 | 87/111 [00:59<00:16, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9471, LAS: 0.9017, UEM: 0.5661, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.4737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.7102, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 82%|########1 | 91/111 [01:01<00:12, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9471, LAS: 0.9017, UEM: 0.5694, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3132, partial_loss/deprel_loss: 0.8401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1081, loss: 0.7094, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 86%|########5 | 95/111 [01:04<00:10, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9467, LAS: 0.9015, UEM: 0.5678, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4053, partial_loss/deprel_loss: 0.4962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7116, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 89%|########9 | 99/111 [01:07<00:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9472, LAS: 0.9019, UEM: 0.5759, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1922, partial_loss/deprel_loss: 0.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.7089, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||: 93%|#########2| 103/111 [01:10<00:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9472, LAS: 0.9020, UEM: 0.5894, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3455, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2516, loss: 0.7093, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||: 95%|#########5| 
106/111 [01:12<00:03, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9473, LAS: 0.9022, UEM: 0.5902, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0149, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.7074, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||: 99%|#########9| 110/111 [01:14<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9474, LAS: 0.9022, UEM: 0.5892, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5141, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6635, loss: 0.7070, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||: 100%|##########| 111/111 [01:15<00:00, 1.47it/s]\n", + "2023-04-07 00:31:33,915 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9126, LAS: 0.8528, UEM: 0.2678, LEM: 0.0820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5891, partial_loss/deprel_loss: 57.0978, partial_loss/cycle_loss: 0.0000, batch_loss: 45.9961, loss: 35.5607, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.04s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9458, LAS: 0.8918, UEM: 0.6731, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4201, partial_loss/deprel_loss: 24.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9815, loss: 26.3380, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:08, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9447, LAS: 0.8922, UEM: 0.6285, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0363, partial_loss/deprel_loss: 36.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 29.4754, loss: 26.2771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9436, LAS: 0.8913, UEM: 0.6011, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5407, partial_loss/deprel_loss: 24.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6864, loss: 26.8626, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:09<00:02, 1.02it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9466, LAS: 0.8953, UEM: 0.6564, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1730, partial_loss/deprel_loss: 20.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3750, loss: 25.7702, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9464, LAS: 0.8949, UEM: 0.6475, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 34.6901, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8825, loss: 25.9327, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.04it/s]\n", + "2023-04-07 00:31:46,420 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 
00:31:46,421 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.484 | 34.690\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.514 | 0.652\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | 0.000\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UEM | 0.589 | 0.648\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LAS | 0.902 | 0.895\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - loss | 0.707 | 25.933\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LEM | 0.354 | 0.382\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - UAS | 0.947 | 0.946\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - 
EM | 0.907 | 0.890\n", + "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:31:46,427 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:31:51,593 - INFO - combo.training.trainer - Epoch duration: 0:01:35.977183\n", + "2023-04-07 00:31:51,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:08\n", + "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Epoch 76/399\n", + "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:31:51,596 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:31:51,605 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9347, LAS: 0.8909, UEM: 0.5095, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2675, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0746, loss: 0.7894, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 4%|3 | 4/111 [00:02<01:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9366, LAS: 0.8924, UEM: 0.3993, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 0.7514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 0.7899, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 7%|7 | 8/111 [00:05<01:05, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9376, LAS: 0.8935, UEM: 0.3859, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.6642, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8321, loss: 0.7815, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 10%|9 | 11/111 [00:07<01:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9429, LAS: 0.8999, UEM: 0.5021, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.7301, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 13%|#2 | 14/111 [00:09<01:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9421, LAS: 0.8981, UEM: 0.4642, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5952, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7526, loss: 0.7337, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 16%|#6 | 18/111 [00:12<01:03, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9433, LAS: 0.8993, UEM: 0.4622, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7205, partial_loss/deprel_loss: 0.6275, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8194, loss: 0.7294, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 19%|#8 | 21/111 [00:14<01:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9412, LAS: 0.8971, UEM: 0.4414, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5751, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7429, loss: 0.7399, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 22%|##1 | 24/111 [00:16<00:59, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9438, LAS: 0.9003, UEM: 0.4829, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.7217, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 25%|##5 | 28/111 [00:18<00:53, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9451, LAS: 0.9016, UEM: 0.5168, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8150, loss: 0.7092, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 28%|##7 | 31/111 [00:20<00:56, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9432, LAS: 0.8997, UEM: 0.5206, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7606, partial_loss/deprel_loss: 0.6660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8582, loss: 0.7262, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 31%|### | 34/111 [00:23<00:55, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9443, LAS: 0.9008, UEM: 0.5325, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2798, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.7177, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 33%|###3 | 37/111 [00:25<00:52, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9462, LAS: 0.9029, UEM: 0.5708, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.0746, partial_loss/deprel_loss: 0.1974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3461, loss: 0.7017, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 36%|###6 | 40/111 [00:27<00:49, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9462, LAS: 0.9027, UEM: 0.5641, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.7032, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 39%|###8 | 43/111 [00:29<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9468, LAS: 0.9032, UEM: 0.5601, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.6927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8361, loss: 0.7015, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||: 42%|####2 | 47/111 [00:32<00:44, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9467, LAS: 0.9027, UEM: 0.5492, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.7062, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 45%|####5 | 50/111 [00:34<00:41, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9462, LAS: 0.9021, UEM: 0.5426, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 0.7196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9672, loss: 0.7087, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 49%|####8 | 54/111 [00:36<00:37, 
1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9460, LAS: 0.9020, UEM: 0.5445, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1289, partial_loss/deprel_loss: 0.2808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4237, loss: 0.7099, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 52%|#####2 | 58/111 [00:39<00:34, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9462, LAS: 0.9021, UEM: 0.5429, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7801, partial_loss/deprel_loss: 0.6634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8600, loss: 0.7097, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 56%|#####5 | 62/111 [00:42<00:33, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9451, LAS: 0.9010, UEM: 0.5357, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4855, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6469, loss: 0.7182, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 59%|#####8 | 65/111 [00:44<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9461, LAS: 0.9021, UEM: 0.5474, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.7102, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 61%|######1 | 68/111 [00:46<00:30, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9467, LAS: 0.9027, UEM: 0.5512, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.7054, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 65%|######4 | 72/111 [00:49<00:27, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9475, LAS: 0.9035, UEM: 0.5626, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5158, loss: 0.6985, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 68%|######7 | 75/111 [00:51<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9473, LAS: 0.9034, UEM: 0.5586, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.7342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9401, loss: 0.7008, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 72%|#######2 | 80/111 [00:53<00:19, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9467, LAS: 0.9025, UEM: 0.5626, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4381, loss: 0.7070, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 76%|#######5 | 84/111 [00:56<00:17, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9468, LAS: 0.9025, UEM: 0.5600, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7073, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 79%|#######9 | 88/111 [00:59<00:15, 
1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9472, LAS: 0.9029, UEM: 0.5658, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.4354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7038, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||: 83%|########2 | 92/111 [01:02<00:13, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9040, UEM: 0.5924, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.6952, batch_reg_loss: 0.1732, reg_loss: 0.1732 ||: 86%|########5 | 95/111 [01:05<00:12, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9480, LAS: 0.9038, UEM: 0.5892, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 89%|########9 | 99/111 [01:07<00:08, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9482, LAS: 0.9040, UEM: 0.5977, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1306, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3963, loss: 0.6941, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 92%|#########1| 102/111 [01:10<00:06, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9480, LAS: 
0.9038, UEM: 0.5968, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9104, partial_loss/deprel_loss: 0.7103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9235, loss: 0.6946, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 95%|#########4| 105/111 [01:12<00:04, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9480, LAS: 0.9037, UEM: 0.5927, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.6759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8316, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 98%|#########8| 109/111 [01:14<00:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9473, LAS: 0.9031, UEM: 0.5895, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4323, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1164, loss: 0.7008, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 
0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.821 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.432 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UEM | 0.590 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LAS | 0.903 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - loss | 0.701 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEM | 0.358 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - UAS | 0.947 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EM | 0.842 | N/A\n", + "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:33:10,837 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:33:15,301 - INFO - combo.training.trainer - Epoch duration: 0:01:23.706250\n", + "2023-04-07 00:33:15,302 - INFO - combo.training.trainer - Estimated training time remaining: 7:14:01\n", + "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Epoch 77/399\n", + "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:33:15,303 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:33:15,313 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9540, LAS: 0.9091, UEM: 0.4911, LEM: 0.2216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3272, partial_loss/deprel_loss: 0.4489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.6525, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 4%|3 | 4/111 [00:02<01:08, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9550, LAS: 0.9096, UEM: 0.5444, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1937, partial_loss/deprel_loss: 0.3571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.6352, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 6%|6 | 7/111 [00:04<01:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9568, LAS: 0.9127, UEM: 0.6099, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3553, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6122, loss: 0.6160, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 9%|9 | 10/111 [00:06<01:08, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9545, LAS: 0.9111, UEM: 0.5946, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4713, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.6297, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 12%|#1 | 13/111 [00:09<01:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9542, LAS: 0.9106, UEM: 0.5909, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5831, loss: 0.6357, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 14%|#4 | 16/111 [00:11<01:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9499, LAS: 0.9057, UEM: 0.5877, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7246, loss: 0.6704, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 17%|#7 | 19/111 [00:13<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9477, LAS: 0.9023, UEM: 0.5584, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7295, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8338, loss: 0.6924, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 20%|#9 | 22/111 [00:15<01:04, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9458, LAS: 0.9005, UEM: 0.5394, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6471, loss: 0.7056, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 23%|##2 | 25/111 [00:18<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9491, LAS: 0.9041, UEM: 0.5924, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6803, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 25%|##5 | 28/111 [00:20<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9486, LAS: 0.9040, UEM: 0.5864, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.6813, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 28%|##7 | 31/111 [00:22<00:56, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9480, LAS: 0.9034, UEM: 0.5770, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.6854, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||: 32%|###1 | 35/111 [00:24<00:52, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9487, LAS: 0.9038, UEM: 0.5780, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2471, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5682, loss: 0.6814, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 34%|###4 | 38/111 [00:26<00:50, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9490, LAS: 0.9041, UEM: 0.5731, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.6454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8054, loss: 0.6820, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 37%|###6 | 41/111 [00:29<00:49, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9507, LAS: 0.9061, UEM: 0.5970, LEM: 0.3520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2123, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.6680, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 40%|###9 | 44/111 [00:31<00:47, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9510, LAS: 0.9065, UEM: 0.5949, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5873, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6658, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 42%|####2 | 47/111 [00:33<00:46, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9517, LAS: 0.9072, UEM: 0.6124, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.6589, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 45%|####5 | 50/111 [00:35<00:45, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9508, LAS: 0.9060, UEM: 0.6017, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.5163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.6699, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 49%|####8 | 54/111 [00:38<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9505, LAS: 0.9062, UEM: 0.6242, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0425, partial_loss/deprel_loss: 0.1334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2883, loss: 0.6690, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 51%|#####1 | 57/111 [00:41<00:42, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9501, LAS: 0.9056, UEM: 0.6222, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.6729, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 55%|#####4 | 61/111 [00:43<00:36, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9498, LAS: 0.9051, UEM: 0.6129, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6639, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8237, loss: 0.6772, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 58%|#####7 | 64/111 [00:45<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9495, LAS: 0.9047, UEM: 0.6096, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.6809, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||: 60%|###### | 67/111 [00:48<00:32, 1.36it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9498, LAS: 0.9050, UEM: 0.6106, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1373, partial_loss/deprel_loss: 0.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.6803, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 63%|######3 | 70/111 [00:50<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9489, LAS: 0.9041, UEM: 0.6022, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6463, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 66%|######5 | 73/111 [00:52<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9492, LAS: 0.9046, UEM: 0.6020, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3846, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6829, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 68%|######8 | 76/111 [00:54<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9493, LAS: 0.9047, UEM: 0.5995, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0225, partial_loss/deprel_loss: 0.7170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9511, loss: 0.6818, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 72%|#######2 | 80/111 [00:57<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9496, LAS: 0.9049, UEM: 0.5995, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.6812, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 75%|#######4 | 83/111 [00:59<00:20, 1.39it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9490, LAS: 0.9043, UEM: 0.5976, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9099, partial_loss/deprel_loss: 0.7320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9406, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||: 78%|#######8 | 87/111 [01:02<00:16, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9490, LAS: 0.9044, UEM: 0.5949, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.6859, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 81%|########1 | 90/111 [01:06<00:20, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9494, LAS: 0.9049, UEM: 0.6072, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0955, partial_loss/deprel_loss: 0.2082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3586, loss: 0.6819, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 84%|########3 | 93/111 [01:09<00:17, 1.06it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9491, LAS: 0.9046, UEM: 0.6034, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7977, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.6841, 
batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 86%|########6 | 96/111 [01:11<00:13, 1.15it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9492, LAS: 0.9047, UEM: 0.6042, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4756, loss: 0.6822, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 89%|########9 | 99/111 [01:13<00:09, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9485, LAS: 0.9039, UEM: 0.5998, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6815, partial_loss/deprel_loss: 0.5970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7868, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 92%|#########1| 102/111 [01:15<00:07, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9487, LAS: 0.9040, UEM: 0.5997, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6866, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8256, loss: 0.6861, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 95%|#########4| 105/111 [01:18<00:04, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9485, LAS: 0.9037, UEM: 0.5933, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8087, partial_loss/deprel_loss: 0.8120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9843, loss: 0.6896, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 98%|#########8| 109/111 [01:20<00:01, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 
0.9480, LAS: 0.9032, UEM: 0.5896, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.6683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9109, loss: 0.6941, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 100%|##########| 111/111 [01:21<00:00, 1.35it/s]\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.668 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 1.017 | N/A\n", + "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UEM | 0.590 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LAS | 0.903 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - loss | 0.694 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - 
combo.training.tensorboard_writer - LEM | 0.359 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UAS | 0.948 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EM | 0.875 | N/A\n", + "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:34:40,196 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:34:44,979 - INFO - combo.training.trainer - Epoch duration: 0:01:29.676969\n", + "2023-04-07 00:34:44,980 - INFO - combo.training.trainer - Estimated training time remaining: 7:13:18\n", + "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Epoch 78/399\n", + "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:34:44,981 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:34:44,988 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9679, LAS: 0.9231, UEM: 0.7181, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.3727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.5293, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 3%|2 | 3/111 [00:02<01:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9566, LAS: 0.9133, UEM: 0.6358, LEM: 0.3537, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.6221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.6167, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 5%|5 | 6/111 [00:04<01:13, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9543, LAS: 0.9101, UEM: 0.6182, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3246, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 9%|9 | 10/111 [00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9486, LAS: 0.9035, UEM: 0.5601, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.6585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8727, loss: 0.6916, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 12%|#1 | 13/111 [00:08<01:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9496, LAS: 0.9042, UEM: 0.5650, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5894, partial_loss/deprel_loss: 0.5549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.6833, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 14%|#4 | 16/111 [00:11<01:06, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9507, LAS: 0.9051, UEM: 0.5807, LEM: 0.3174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5727, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7888, 
loss: 0.6759, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 17%|#7 | 19/111 [00:13<01:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9504, LAS: 0.9054, UEM: 0.5797, LEM: 0.3181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5428, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7111, loss: 0.6827, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 20%|#9 | 22/111 [00:15<01:05, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9482, LAS: 0.9033, UEM: 0.5805, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2453, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1083, loss: 0.6936, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 23%|##2 | 25/111 [00:17<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9480, LAS: 0.9034, UEM: 0.5686, LEM: 0.3231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7153, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7766, loss: 0.6925, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 25%|##5 | 28/111 [00:20<01:03, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9483, LAS: 0.9041, UEM: 0.5652, LEM: 0.3186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5495, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 28%|##7 | 31/111 [00:22<01:02, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9485, LAS: 0.9044, 
UEM: 0.5621, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0274, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0280, loss: 0.6880, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 32%|###1 | 35/111 [00:25<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9465, LAS: 0.9023, UEM: 0.5479, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8060, partial_loss/deprel_loss: 0.7816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9593, loss: 0.7045, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 35%|###5 | 39/111 [00:27<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9456, LAS: 0.9013, UEM: 0.5402, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5544, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7852, loss: 0.7115, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 38%|###7 | 42/111 [00:29<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9461, LAS: 0.9019, UEM: 0.5449, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7151, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8796, loss: 0.7092, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 41%|#### | 45/111 [00:31<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9474, LAS: 0.9031, UEM: 0.5644, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.6419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.7012, batch_reg_loss: 
0.1729, reg_loss: 0.1729 ||: 43%|####3 | 48/111 [00:34<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9469, LAS: 0.9025, UEM: 0.5606, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8224, partial_loss/deprel_loss: 0.6433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8520, loss: 0.7051, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 47%|####6 | 52/111 [00:36<00:40, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9475, LAS: 0.9031, UEM: 0.5585, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2593, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.7007, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||: 50%|####9 | 55/111 [00:38<00:39, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9470, LAS: 0.9024, UEM: 0.5479, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4642, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7049, loss: 0.7073, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 53%|#####3 | 59/111 [00:41<00:34, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9475, LAS: 0.9030, UEM: 0.5552, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4942, partial_loss/deprel_loss: 0.5451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7077, loss: 0.7039, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 57%|#####6 | 63/111 [00:43<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9472, LAS: 0.9028, UEM: 0.5517, LEM: 
0.3139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3959, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.7036, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 60%|###### | 67/111 [00:46<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9478, LAS: 0.9035, UEM: 0.5566, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2160, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5036, loss: 0.6997, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 64%|######3 | 71/111 [00:49<00:27, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9476, LAS: 0.9032, UEM: 0.5699, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0714, partial_loss/deprel_loss: 0.2042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7030, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 67%|######6 | 74/111 [00:51<00:25, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9465, LAS: 0.9023, UEM: 0.5679, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8180, partial_loss/deprel_loss: 0.6136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.7098, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 69%|######9 | 77/111 [00:54<00:24, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9465, LAS: 0.9021, UEM: 0.5639, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6078, partial_loss/deprel_loss: 0.6108, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7830, loss: 0.7105, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 73%|#######2 | 81/111 [00:56<00:21, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9470, LAS: 0.9028, UEM: 0.5722, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1430, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4033, loss: 0.7049, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 76%|#######5 | 84/111 [00:58<00:19, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9474, LAS: 0.9034, UEM: 0.5887, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6315, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7844, loss: 0.6999, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 78%|#######8 | 87/111 [01:01<00:17, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9481, LAS: 0.9040, UEM: 0.5977, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6947, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 81%|########1 | 90/111 [01:03<00:15, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9479, LAS: 0.9036, UEM: 0.5902, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6856, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6968, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 85%|########4 | 94/111 [01:06<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9479, LAS: 0.9038, UEM: 0.5882, LEM: 0.3587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3477, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6485, loss: 0.6960, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 87%|########7 | 97/111 [01:08<00:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9475, LAS: 0.9035, UEM: 0.5840, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6664, partial_loss/deprel_loss: 0.5377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7362, loss: 0.6976, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 90%|######### | 100/111 [01:10<00:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9480, LAS: 0.9041, UEM: 0.5887, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.6932, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||: 94%|#########3| 104/111 [01:13<00:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9486, LAS: 0.9047, UEM: 0.5946, LEM: 0.3647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2394, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6893, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||: 96%|#########6| 107/111 [01:15<00:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9489, LAS: 0.9049, UEM: 0.5942, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6411, 
partial_loss/deprel_loss: 0.6306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8055, loss: 0.6882, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||: 99%|#########9| 110/111 [01:17<00:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9489, LAS: 0.9048, UEM: 0.5932, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.6202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7615, loss: 0.6888, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||: 100%|##########| 111/111 [01:18<00:00, 1.42it/s]\n", + "2023-04-07 00:36:06,576 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.620 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.463 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UEM | 0.593 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - 
combo.training.tensorboard_writer - LAS | 0.905 | N/A\n", + "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - loss | 0.689 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEM | 0.362 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - UAS | 0.949 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EM | 0.898 | N/A\n", + "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:36:06,583 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:36:11,692 - INFO - combo.training.trainer - Epoch duration: 0:01:26.712266\n", + "2023-04-07 00:36:11,693 - INFO - combo.training.trainer - Estimated training time remaining: 7:12:21\n", + "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Epoch 79/399\n", + "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:36:11,701 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9567, LAS: 0.9180, UEM: 0.5695, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2451, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 0.6235, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 4%|3 | 4/111 [00:02<01:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8239, UAS: 0.9426, LAS: 0.9010, UEM: 0.4922, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.0595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3627, loss: 0.7478, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 7%|7 | 8/111 [00:05<01:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9500, LAS: 0.9082, UEM: 0.6338, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6534, loss: 0.6912, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 10%|9 | 11/111 
[00:07<01:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9476, LAS: 0.9051, UEM: 0.5838, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.4990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7086, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 14%|#3 | 15/111 [00:10<01:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9468, LAS: 0.9040, UEM: 0.5621, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3119, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7126, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 16%|#6 | 18/111 [00:12<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9495, LAS: 0.9071, UEM: 0.6012, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4632, loss: 0.6835, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 19%|#8 | 21/111 [00:14<01:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9512, LAS: 0.9097, UEM: 0.6573, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7300, partial_loss/deprel_loss: 0.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8295, loss: 0.6655, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 22%|##1 | 24/111 [00:16<01:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9509, LAS: 0.9091, UEM: 0.6380, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.6719, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 25%|##5 | 28/111 [00:19<00:57, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9527, LAS: 0.9108, UEM: 0.6429, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2971, partial_loss/deprel_loss: 0.4320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.6572, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 29%|##8 | 32/111 [00:21<00:51, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9526, LAS: 0.9103, UEM: 0.6318, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3001, partial_loss/deprel_loss: 0.4517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6554, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 32%|###1 | 35/111 [00:23<00:50, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8422, UAS: 0.9514, LAS: 0.9086, UEM: 0.6262, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2311, partial_loss/deprel_loss: 0.8674, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1128, loss: 0.6664, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 34%|###4 | 38/111 [00:25<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9524, LAS: 0.9097, UEM: 0.6317, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5211, loss: 0.6570, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||: 37%|###6 | 41/111 [00:27<00:48, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9507, LAS: 0.9078, UEM: 0.6229, LEM: 0.4022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1997, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4966, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 41%|#### | 45/111 [00:30<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9501, LAS: 0.9073, UEM: 0.6259, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1513, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4078, loss: 0.6734, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 44%|####4 | 49/111 [00:33<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9506, LAS: 0.9077, UEM: 0.6257, LEM: 0.4059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5370, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7598, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 47%|####6 | 52/111 [00:35<00:41, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9509, LAS: 0.9082, UEM: 0.6271, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4542, loss: 0.6671, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 50%|##### | 56/111 [00:38<00:38, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9504, LAS: 0.9075, UEM: 0.6145, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 0.5008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.6702, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 54%|#####4 | 60/111 [00:40<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9511, LAS: 0.9083, UEM: 0.6169, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.6644, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 58%|#####7 | 64/111 [00:43<00:32, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9515, LAS: 0.9084, UEM: 0.6153, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2341, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.6629, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 60%|###### | 67/111 [00:45<00:30, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9511, LAS: 0.9079, UEM: 0.6110, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8882, partial_loss/deprel_loss: 0.7016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9115, loss: 0.6672, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 63%|######3 | 70/111 [00:48<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9509, LAS: 0.9078, UEM: 0.6095, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.6690, batch_reg_loss: 
0.1726, reg_loss: 0.1727 ||: 66%|######5 | 73/111 [00:50<00:27, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9505, LAS: 0.9071, UEM: 0.6078, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.6730, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 69%|######9 | 77/111 [00:52<00:23, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9508, LAS: 0.9073, UEM: 0.6133, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1380, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.6704, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 72%|#######2 | 80/111 [00:54<00:21, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9498, LAS: 0.9063, UEM: 0.6056, LEM: 0.3753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5038, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2339, loss: 0.6799, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||: 76%|#######5 | 84/111 [00:57<00:18, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9499, LAS: 0.9062, UEM: 0.6077, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6644, partial_loss/deprel_loss: 0.6769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8469, loss: 0.6789, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 78%|#######8 | 87/111 [00:59<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9496, LAS: 0.9058, UEM: 
0.6070, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7890, partial_loss/deprel_loss: 0.8387, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0013, loss: 0.6827, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 81%|########1 | 90/111 [01:01<00:14, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9486, LAS: 0.9046, UEM: 0.5989, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4162, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6961, loss: 0.6908, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 85%|########4 | 94/111 [01:04<00:11, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9480, LAS: 0.9039, UEM: 0.5931, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6230, partial_loss/deprel_loss: 0.6034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6954, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 88%|########8 | 98/111 [01:07<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9481, LAS: 0.9041, UEM: 0.5966, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8358, partial_loss/deprel_loss: 0.7337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9267, loss: 0.6936, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 91%|######### | 101/111 [01:09<00:07, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9480, LAS: 0.9040, UEM: 0.5914, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4340, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.6934, 
batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 95%|#########4| 105/111 [01:11<00:04, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9478, LAS: 0.9037, UEM: 0.5856, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8297, partial_loss/deprel_loss: 0.6664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8716, loss: 0.6959, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 98%|#########8| 109/111 [01:14<00:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9479, LAS: 0.9038, UEM: 0.5869, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7285, partial_loss/deprel_loss: 0.5894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7897, loss: 0.6951, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-07 00:37:30,881 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.589 | 
N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.729 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - reg_loss | 0.173 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UEM | 0.587 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LAS | 0.904 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - loss | 0.695 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LEM | 0.360 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - UAS | 0.948 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EM | 0.889 | N/A\n", + "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:37:30,890 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Epoch duration: 0:01:25.198854\n", + "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:18\n", + "2023-04-07 00:37:36,892 - INFO - allennlp.training.trainer - Epoch 80/399\n", + "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:37:36,903 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9620, LAS: 0.9237, UEM: 0.6907, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.5313, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9603, LAS: 0.9177, UEM: 0.6303, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4412, partial_loss/deprel_loss: 0.5262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.5811, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 5%|5 | 6/111 [00:04<01:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9588, LAS: 0.9181, UEM: 0.6741, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7152, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 0.5944, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 8%|8 | 9/111 
[00:06<01:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9549, LAS: 0.9129, UEM: 0.6113, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6329, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 12%|#1 | 13/111 [00:09<01:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9546, LAS: 0.9125, UEM: 0.6094, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4229, partial_loss/deprel_loss: 0.4221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6348, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 14%|#4 | 16/111 [00:11<01:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9532, LAS: 0.9108, UEM: 0.6202, LEM: 0.4140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9059, partial_loss/deprel_loss: 0.7547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9574, loss: 0.6489, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 17%|#7 | 19/111 [00:13<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9530, LAS: 0.9100, UEM: 0.6040, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3067, partial_loss/deprel_loss: 0.4951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.6532, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 20%|#9 | 22/111 [00:15<01:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9490, LAS: 0.9057, UEM: 0.5830, LEM: 0.3724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4699, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7044, loss: 0.6857, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 23%|##2 | 25/111 [00:18<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9502, LAS: 0.9070, UEM: 0.5930, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2599, partial_loss/deprel_loss: 0.4180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5588, loss: 0.6773, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 26%|##6 | 29/111 [00:20<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9518, LAS: 0.9092, UEM: 0.6273, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2288, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6576, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||: 29%|##8 | 32/111 [00:23<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9495, LAS: 0.9065, UEM: 0.6101, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6791, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 32%|###1 | 35/111 [00:25<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9486, LAS: 0.9054, UEM: 0.6030, LEM: 0.3847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5379, partial_loss/deprel_loss: 0.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7500, loss: 0.6869, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 34%|###4 | 38/111 [00:27<00:52, 1.38it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.9468, LAS: 0.9033, UEM: 0.5977, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7654, partial_loss/deprel_loss: 0.9535, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2883, loss: 0.7037, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 37%|###6 | 41/111 [00:29<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9469, LAS: 0.9034, UEM: 0.5872, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5514, loss: 0.7030, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 41%|#### | 45/111 [00:31<00:44, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9462, LAS: 0.9022, UEM: 0.5714, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5592, partial_loss/deprel_loss: 0.6000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7643, loss: 0.7125, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 44%|####4 | 49/111 [00:34<00:40, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9474, LAS: 0.9035, UEM: 0.5757, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.7029, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 48%|####7 | 53/111 [00:37<00:41, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9485, LAS: 0.9047, UEM: 0.5836, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6956, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 50%|##### | 56/111 [00:39<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9483, LAS: 0.9043, UEM: 0.5866, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4921, loss: 0.6978, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 53%|#####3 | 59/111 [00:41<00:36, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9490, LAS: 0.9051, UEM: 0.5953, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2126, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4870, loss: 0.6900, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 56%|#####5 | 62/111 [00:44<00:37, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9492, LAS: 0.9052, UEM: 0.5994, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2119, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5176, loss: 0.6883, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 59%|#####8 | 65/111 [00:46<00:34, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9495, LAS: 0.9056, UEM: 0.6049, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1288, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.6860, batch_reg_loss: 0.1724, 
reg_loss: 0.1725 ||: 61%|######1 | 68/111 [00:48<00:31, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9491, LAS: 0.9052, UEM: 0.6076, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 0.7577, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0465, loss: 0.6871, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 64%|######3 | 71/111 [00:50<00:29, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9494, LAS: 0.9057, UEM: 0.6087, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.4091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5593, loss: 0.6846, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||: 67%|######6 | 74/111 [00:53<00:27, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9496, LAS: 0.9057, UEM: 0.6040, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3739, partial_loss/deprel_loss: 0.5073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6851, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 70%|####### | 78/111 [00:55<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9496, LAS: 0.9056, UEM: 0.6007, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6847, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 74%|#######3 | 82/111 [00:57<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9495, LAS: 0.9057, UEM: 0.5956, LEM: 
0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4589, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6845, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 77%|#######6 | 85/111 [01:00<00:18, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9495, LAS: 0.9056, UEM: 0.5939, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6853, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||: 80%|######## | 89/111 [01:02<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9491, LAS: 0.9052, UEM: 0.5858, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7029, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7993, loss: 0.6869, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 84%|########3 | 93/111 [01:05<00:11, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9482, LAS: 0.9041, UEM: 0.5799, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9657, partial_loss/deprel_loss: 0.7077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9316, loss: 0.6950, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 87%|########7 | 97/111 [01:07<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9480, LAS: 0.9037, UEM: 0.5733, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5950, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7570, loss: 0.6973, batch_reg_loss: 
0.1723, reg_loss: 0.1724 ||: 91%|######### | 101/111 [01:10<00:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9483, LAS: 0.9039, UEM: 0.5756, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7691, loss: 0.6958, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 95%|#########4| 105/111 [01:13<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9485, LAS: 0.9043, UEM: 0.5833, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4842, loss: 0.6930, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 97%|#########7| 108/111 [01:15<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00, 1.43it/s]\n", + "2023-04-07 00:38:57,543 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9029, LAS: 0.8477, UEM: 0.1151, LEM: 0.0144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3311, partial_loss/deprel_loss: 47.7680, partial_loss/cycle_loss: 0.0000, batch_loss: 38.4806, loss: 41.8893, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.09s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9320, LAS: 0.8765, UEM: 0.5111, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 24.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 19.4517, loss: 30.7239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:05<00:08, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9407, LAS: 0.8871, UEM: 0.6027, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 23.6009, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9157, loss: 28.3449, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:05, 1.01s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9430, LAS: 0.8909, UEM: 0.5963, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 17.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 14.0323, loss: 26.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9458, LAS: 0.8946, UEM: 0.6489, LEM: 0.3860, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7757, partial_loss/deprel_loss: 29.8046, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9988, loss: 25.6342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.06it/s]\n", + "2023-04-07 00:39:09,770 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.672 | 29.805\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.732 | 0.776\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | 0.000\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - UEM | 0.595 | 0.649\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LAS | 0.904 | 0.895\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - loss | 0.691 | 25.634\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEM 
| 0.365 | 0.386\n", + "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - UAS | 0.949 | 0.946\n", + "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EM | 0.875 | 0.881\n", + "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:39:09,780 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:39:14,857 - INFO - combo.training.trainer - Epoch duration: 0:01:37.964569\n", + "2023-04-07 00:39:14,858 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:04\n", + "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Epoch 81/399\n", + "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:39:14,859 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:39:14,868 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9547, LAS: 0.9104, UEM: 0.6792, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7273, loss: 0.6154, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 3%|2 | 3/111 [00:02<01:14, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9549, LAS: 0.9128, UEM: 0.7015, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2751, partial_loss/deprel_loss: 0.3782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.6082, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 6%|6 | 7/111 [00:04<01:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9524, LAS: 0.9107, UEM: 0.6876, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6333, partial_loss/deprel_loss: 0.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7808, loss: 0.6312, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 9%|9 | 10/111 [00:06<01:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9514, LAS: 0.9102, UEM: 0.6589, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.6450, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 12%|#1 | 13/111 [00:08<01:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9522, LAS: 0.9101, UEM: 0.6362, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.6486, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 14%|#4 | 16/111 [00:11<01:10, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9496, LAS: 0.9079, UEM: 0.6037, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4495, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6475, loss: 0.6674, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 17%|#7 | 19/111 [00:13<01:07, 
1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9513, LAS: 0.9092, UEM: 0.6182, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2502, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5469, loss: 0.6559, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 20%|#9 | 22/111 [00:15<01:05, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9502, LAS: 0.9075, UEM: 0.6075, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1735, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4646, loss: 0.6651, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 23%|##2 | 25/111 [00:17<01:02, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9510, LAS: 0.9083, UEM: 0.6091, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1998, partial_loss/deprel_loss: 0.3217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4696, loss: 0.6594, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 25%|##5 | 28/111 [00:20<01:01, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9499, LAS: 0.9070, UEM: 0.6042, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2352, partial_loss/deprel_loss: 0.7932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0539, loss: 0.6675, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 28%|##7 | 31/111 [00:22<00:59, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9509, LAS: 0.9084, UEM: 0.6005, LEM: 
0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3909, partial_loss/deprel_loss: 0.4168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.6564, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 32%|###1 | 35/111 [00:25<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9528, LAS: 0.9105, UEM: 0.6227, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2360, partial_loss/deprel_loss: 0.3608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.6427, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 34%|###4 | 38/111 [00:27<00:52, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9514, LAS: 0.9089, UEM: 0.6216, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4446, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6127, loss: 0.6547, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||: 37%|###6 | 41/111 [00:29<00:50, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9518, LAS: 0.9095, UEM: 0.6119, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4576, partial_loss/deprel_loss: 0.4736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.6515, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 41%|#### | 45/111 [00:31<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9508, LAS: 0.9086, UEM: 0.6184, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4012, loss: 0.6600, batch_reg_loss: 0.1722, reg_loss: 
0.1723 ||: 43%|####3 | 48/111 [00:34<00:45, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9505, LAS: 0.9082, UEM: 0.6075, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6638, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 46%|####5 | 51/111 [00:36<00:44, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9509, LAS: 0.9087, UEM: 0.6097, LEM: 0.3735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.6610, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 49%|####8 | 54/111 [00:38<00:42, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9501, LAS: 0.9077, UEM: 0.6038, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0205, partial_loss/deprel_loss: 0.7639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9874, loss: 0.6706, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 51%|#####1 | 57/111 [00:41<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9498, LAS: 0.9072, UEM: 0.5953, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6021, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6743, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 55%|#####4 | 61/111 [00:43<00:35, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9496, LAS: 0.9071, UEM: 0.5866, LEM: 0.3521, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5802, loss: 0.6753, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 59%|#####8 | 65/111 [00:46<00:31, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9505, LAS: 0.9079, UEM: 0.5911, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2425, partial_loss/deprel_loss: 0.4279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.6692, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 62%|######2 | 69/111 [00:49<00:29, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9508, LAS: 0.9080, UEM: 0.5965, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1185, partial_loss/deprel_loss: 0.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.6676, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 66%|######5 | 73/111 [00:51<00:26, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9508, LAS: 0.9081, UEM: 0.6005, LEM: 0.3605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6657, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||: 68%|######8 | 76/111 [00:54<00:26, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9501, LAS: 0.9073, UEM: 0.5916, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7469, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8567, loss: 0.6726, batch_reg_loss: 0.1722, reg_loss: 0.1723 
||: 71%|#######1 | 79/111 [00:56<00:23, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9500, LAS: 0.9070, UEM: 0.5944, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3228, partial_loss/deprel_loss: 0.8789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.6744, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 75%|#######4 | 83/111 [00:59<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9497, LAS: 0.9067, UEM: 0.5907, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.6763, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 78%|#######8 | 87/111 [01:01<00:16, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9492, LAS: 0.9060, UEM: 0.5841, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6835, partial_loss/deprel_loss: 0.5940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7840, loss: 0.6808, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 81%|########1 | 90/111 [01:03<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9490, LAS: 0.9058, UEM: 0.5808, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8498, loss: 0.6830, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 84%|########3 | 93/111 [01:05<00:12, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8953, UAS: 0.9491, LAS: 0.9058, UEM: 0.5772, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.6745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8483, loss: 0.6848, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 87%|########7 | 97/111 [01:08<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9499, LAS: 0.9066, UEM: 0.5916, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2769, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6777, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||: 91%|######### | 101/111 [01:11<00:06, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9636, UAS: 0.9495, LAS: 0.9062, UEM: 0.6024, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0667, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3005, loss: 0.6809, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 94%|#########3| 104/111 [01:13<00:05, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9497, LAS: 0.9063, UEM: 0.6006, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6036, loss: 0.6805, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 96%|#########6| 107/111 [01:16<00:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9496, LAS: 0.9061, UEM: 0.5974, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4782, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.6823, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 99%|#########9| 110/111 [01:18<00:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9495, LAS: 0.9060, UEM: 0.5958, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.6830, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 100%|##########| 111/111 [01:18<00:00, 1.41it/s]\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.598 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.526 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UEM | 0.596 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - 
LAS | 0.906 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - loss | 0.683 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEM | 0.366 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EM | 0.895 | N/A\n", + "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:40:37,041 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Epoch duration: 0:01:27.026083\n", + "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Estimated training time remaining: 7:10:06\n", + "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Epoch 82/399\n", + "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:40:41,894 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9409, LAS: 0.8998, UEM: 0.4771, LEM: 0.2604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0136, partial_loss/deprel_loss: 0.6579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9012, loss: 0.7123, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 4%|3 | 4/111 [00:02<01:10, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9483, LAS: 0.9083, UEM: 0.6919, LEM: 0.5363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.6607, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 6%|6 | 7/111 [00:05<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9542, LAS: 0.9138, UEM: 0.7011, LEM: 0.4979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6391, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.6194, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 10%|9 | 11/111 [00:07<01:08, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9534, LAS: 0.9131, UEM: 0.6858, LEM: 0.4754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4420, partial_loss/deprel_loss: 0.4731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.6224, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 13%|#2 | 14/111 [00:09<01:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9539, LAS: 0.9126, UEM: 0.6711, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6797, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.6269, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 16%|#6 | 18/111 [00:12<01:01, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9545, LAS: 0.9128, UEM: 0.6608, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3726, partial_loss/deprel_loss: 0.5161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6595, loss: 0.6252, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 19%|#8 | 21/111 [00:14<01:00, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9565, LAS: 0.9145, UEM: 0.6808, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4160, partial_loss/deprel_loss: 0.5045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.6114, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 22%|##1 | 24/111 [00:16<01:01, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9542, LAS: 0.9119, UEM: 0.6572, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7963, loss: 0.6330, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 24%|##4 | 27/111 [00:18<00:58, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9553, LAS: 0.9132, UEM: 0.6573, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2071, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.6242, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 28%|##7 | 31/111 [00:21<00:56, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9533, LAS: 0.9109, UEM: 0.6456, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1913, partial_loss/deprel_loss: 0.8398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.6427, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 31%|### | 34/111 [00:23<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9520, LAS: 0.9095, UEM: 0.6338, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0930, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9448, loss: 0.6531, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 33%|###3 | 37/111 [00:25<00:52, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9523, LAS: 0.9097, UEM: 0.6358, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1727, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4593, loss: 0.6540, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||: 37%|###6 | 41/111 [00:28<00:48, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9517, LAS: 0.9092, UEM: 0.6257, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2168, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.6588, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 41%|#### | 45/111 [00:30<00:42, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9508, LAS: 0.9081, UEM: 0.6245, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4910, partial_loss/deprel_loss: 0.5458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7069, loss: 0.6681, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 44%|####4 | 49/111 [00:33<00:40, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9501, LAS: 0.9071, UEM: 0.6120, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8077, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.6766, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 48%|####7 | 53/111 [00:35<00:39, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9507, LAS: 0.9076, UEM: 0.6135, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2720, partial_loss/deprel_loss: 0.4549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5904, loss: 0.6743, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 50%|##### | 56/111 [00:38<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9502, LAS: 0.9071, UEM: 0.5999, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6217, partial_loss/deprel_loss: 0.5910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6763, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 54%|#####4 | 60/111 [00:40<00:34, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9502, LAS: 0.9069, UEM: 0.5913, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5812, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7507, loss: 0.6767, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9498, LAS: 0.9065, UEM: 0.5906, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.6800, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 60%|###### | 67/111 [00:46<00:32, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9500, LAS: 0.9065, UEM: 0.5908, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2326, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 63%|######3 | 70/111 [00:48<00:30, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9501, LAS: 0.9067, UEM: 0.5942, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.6856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9006, loss: 0.6772, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 66%|######5 | 73/111 [00:50<00:28, 1.36it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9502, LAS: 0.9067, UEM: 0.5941, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4790, loss: 0.6774, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 68%|######8 | 76/111 [00:52<00:26, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9507, LAS: 0.9072, UEM: 0.6020, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3602, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.6746, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 72%|#######2 | 80/111 [00:55<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9504, LAS: 0.9068, UEM: 0.5954, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7883, partial_loss/deprel_loss: 0.6437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8446, loss: 0.6771, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 75%|#######4 | 83/111 [00:57<00:19, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9504, LAS: 0.9068, UEM: 0.5946, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6778, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 77%|#######7 | 86/111 [00:59<00:17, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9503, LAS: 0.9066, UEM: 0.5921, 
LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3417, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 80%|######## | 89/111 [01:01<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9502, LAS: 0.9063, UEM: 0.5880, LEM: 0.3507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7008, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7791, loss: 0.6807, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 83%|########2 | 92/111 [01:03<00:13, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9504, LAS: 0.9067, UEM: 0.5963, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.6775, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 86%|########5 | 95/111 [01:06<00:11, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9498, LAS: 0.9059, UEM: 0.5917, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5857, loss: 0.6827, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 89%|########9 | 99/111 [01:08<00:08, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9501, LAS: 0.9062, UEM: 0.5957, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.4081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5498, loss: 0.6808, 
batch_reg_loss: 0.1720, reg_loss: 0.1721 ||: 92%|#########1| 102/111 [01:10<00:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9501, LAS: 0.9062, UEM: 0.5980, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4289, loss: 0.6796, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 95%|#########5| 106/111 [01:13<00:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9505, LAS: 0.9066, UEM: 0.6012, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6757, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 98%|#########8| 109/111 [01:15<00:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9500, LAS: 0.9062, UEM: 0.5992, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.4593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6101, loss: 0.6789, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 100%|##########| 111/111 [01:17<00:00, 1.44it/s]\n", + "2023-04-07 00:42:02,217 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.459 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.354 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UEM | 0.599 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - LAS | 0.906 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - loss | 0.679 | N/A\n", + "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEM | 0.363 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EM | 0.915 | N/A\n", + "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:42:02,224 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:42:07,283 - INFO - combo.training.trainer - Epoch duration: 0:01:25.398504\n", + "2023-04-07 00:42:07,284 - INFO - combo.training.trainer - Estimated training time remaining: 7:09:01\n", + "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Epoch 83/399\n", + "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:42:07,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:42:07,294 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9284, LAS: 0.8837, UEM: 0.1775, LEM: 0.0476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6096, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.8763, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 3%|2 | 3/111 [00:02<01:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9434, LAS: 0.8991, UEM: 0.5232, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5829, loss: 0.7464, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 5%|5 | 6/111 [00:04<01:14, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9472, LAS: 0.9040, UEM: 0.5188, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.7046, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 9%|9 | 10/111 
[00:06<01:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9509, LAS: 0.9083, UEM: 0.5943, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7866, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6678, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 13%|#2 | 14/111 [00:09<01:03, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9491, LAS: 0.9066, UEM: 0.5690, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4959, partial_loss/deprel_loss: 0.5747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7309, loss: 0.6766, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||: 15%|#5 | 17/111 [00:11<01:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9483, LAS: 0.9054, UEM: 0.5519, LEM: 0.3169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7224, partial_loss/deprel_loss: 0.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8426, loss: 0.6896, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||: 19%|#8 | 21/111 [00:13<00:58, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9476, LAS: 0.9052, UEM: 0.5393, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3746, partial_loss/deprel_loss: 0.7047, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0106, loss: 0.6951, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||: 23%|##3 | 26/111 [00:15<00:50, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9492, LAS: 0.9067, UEM: 0.6104, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.6811, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 27%|##7 | 30/111 [00:18<00:47, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9487, LAS: 0.9066, UEM: 0.5992, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8356, loss: 0.6787, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 31%|### | 34/111 [00:20<00:46, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9484, LAS: 0.9060, UEM: 0.5845, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.6451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8301, loss: 0.6820, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 34%|###4 | 38/111 [00:23<00:43, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9472, LAS: 0.9040, UEM: 0.5775, LEM: 0.3495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.6965, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 38%|###7 | 42/111 [00:25<00:42, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.9025, UEM: 0.5688, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5569, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7552, loss: 0.7069, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 41%|####1 | 46/111 [00:28<00:42, 1.54it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9474, LAS: 0.9046, UEM: 0.6034, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6915, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 45%|####5 | 50/111 [00:31<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9489, LAS: 0.9062, UEM: 0.6256, LEM: 0.4053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1323, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4189, loss: 0.6783, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 48%|####7 | 53/111 [00:34<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9494, LAS: 0.9068, UEM: 0.6231, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6730, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 51%|#####1 | 57/111 [00:36<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9496, LAS: 0.9068, UEM: 0.6177, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.6716, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 55%|#####4 | 61/111 [00:39<00:34, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9496, LAS: 0.9068, UEM: 0.6141, LEM: 0.3893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5248, loss: 0.6721, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 58%|#####7 | 64/111 [00:41<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9504, LAS: 0.9075, UEM: 0.6194, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2091, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5151, loss: 0.6667, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 60%|###### | 67/111 [00:44<00:33, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9505, LAS: 0.9076, UEM: 0.6181, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6354, loss: 0.6657, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 63%|######3 | 70/111 [00:46<00:30, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9504, LAS: 0.9074, UEM: 0.6133, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7722, partial_loss/deprel_loss: 0.6533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8489, loss: 0.6670, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 66%|######5 | 73/111 [00:48<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9505, LAS: 0.9074, UEM: 0.6114, LEM: 0.3800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9190, partial_loss/deprel_loss: 0.6907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.6686, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 68%|######8 | 76/111 [00:50<00:25, 1.35it/s]\n" 
+ ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9506, LAS: 0.9075, UEM: 0.6083, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.6687, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||: 72%|#######2 | 80/111 [00:53<00:22, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9507, LAS: 0.9076, UEM: 0.6118, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1026, partial_loss/deprel_loss: 0.2484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.6690, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 76%|#######5 | 84/111 [00:56<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9502, LAS: 0.9070, UEM: 0.6113, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.6126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8212, loss: 0.6721, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 78%|#######8 | 87/111 [00:58<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9498, LAS: 0.9066, UEM: 0.6044, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6229, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7368, loss: 0.6750, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 81%|########1 | 90/111 [01:00<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9495, LAS: 0.9063, UEM: 
0.6002, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6756, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8084, loss: 0.6786, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 84%|########3 | 93/111 [01:02<00:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9491, LAS: 0.9058, UEM: 0.5947, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3796, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 86%|########6 | 96/111 [01:04<00:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9492, LAS: 0.9059, UEM: 0.5928, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.4503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 90%|######### | 100/111 [01:06<00:07, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9496, LAS: 0.9062, UEM: 0.5967, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1409, partial_loss/deprel_loss: 0.3100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4481, loss: 0.6789, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 94%|#########3| 104/111 [01:09<00:04, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9499, LAS: 0.9066, UEM: 0.6023, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6747, 
batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 97%|#########7| 108/111 [01:12<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9498, LAS: 0.9063, UEM: 0.5988, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6770, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 00:43:24,069 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.536 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.466 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UEM | 0.599 | N/A\n", + "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - LAS | 0.906 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - 
combo.training.tensorboard_writer - loss | 0.677 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEM | 0.364 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EM | 0.896 | N/A\n", + "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:43:24,076 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Epoch duration: 0:01:21.499439\n", + "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Estimated training time remaining: 7:07:41\n", + "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Epoch 84/399\n", + "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:43:28,790 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9514, LAS: 0.9079, UEM: 0.4796, LEM: 0.2044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5584, loss: 0.6576, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 
5%|4 | 5/111 [00:02<00:45, 2.32it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9469, LAS: 0.9044, UEM: 0.4177, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.4723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.6858, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 9%|9 | 10/111 [00:04<00:44, 2.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9428, LAS: 0.9011, UEM: 0.4024, LEM: 0.1678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7110, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 14%|#3 | 15/111 [00:06<00:43, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9426, LAS: 0.9007, UEM: 0.4122, LEM: 0.1725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1330, partial_loss/deprel_loss: 0.7580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0048, loss: 0.7214, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 16%|#6 | 18/111 [00:08<00:49, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9414, LAS: 0.8983, UEM: 0.3904, LEM: 0.1592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5205, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.7382, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 19%|#8 | 21/111 [00:11<00:53, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9424, LAS: 
0.8993, UEM: 0.4119, LEM: 0.1776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.4379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.7295, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 22%|##1 | 24/111 [00:13<00:54, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9434, LAS: 0.9004, UEM: 0.4380, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 0.7223, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 24%|##4 | 27/111 [00:15<00:55, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9455, LAS: 0.9026, UEM: 0.4731, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.7058, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 27%|##7 | 30/111 [00:17<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9473, LAS: 0.9042, UEM: 0.5138, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1126, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4104, loss: 0.6924, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 31%|### | 34/111 [00:20<00:52, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9434, LAS: 0.9001, UEM: 0.4985, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.7238, batch_reg_loss: 
0.1718, reg_loss: 0.1718 ||: 33%|###3 | 37/111 [00:22<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9439, LAS: 0.9003, UEM: 0.4910, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7008, loss: 0.7221, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 36%|###6 | 40/111 [00:24<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9448, LAS: 0.9013, UEM: 0.4970, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.7138, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 39%|###8 | 43/111 [00:26<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9465, LAS: 0.9034, UEM: 0.5256, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4916, loss: 0.6992, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 41%|####1 | 46/111 [00:28<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9223, UAS: 0.9458, LAS: 0.9026, UEM: 0.5203, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2626, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.7034, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||: 44%|####4 | 49/111 [00:31<00:43, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9466, LAS: 0.9034, UEM: 0.5216, LEM: 
0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3617, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.6996, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 47%|####6 | 52/111 [00:33<00:41, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9474, LAS: 0.9043, UEM: 0.5501, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.3062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.6910, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 50%|##### | 56/111 [00:35<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9467, LAS: 0.9035, UEM: 0.5399, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1279, partial_loss/deprel_loss: 0.7786, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0202, loss: 0.6955, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 54%|#####4 | 60/111 [00:38<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9474, LAS: 0.9045, UEM: 0.5443, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4806, loss: 0.6883, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 58%|#####7 | 64/111 [00:40<00:30, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9474, LAS: 0.9044, UEM: 0.5436, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7734, partial_loss/deprel_loss: 0.7165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8995, loss: 0.6890, batch_reg_loss: 0.1717, 
reg_loss: 0.1718 ||: 61%|######1 | 68/111 [00:43<00:27, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9484, LAS: 0.9054, UEM: 0.5534, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5501, loss: 0.6814, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 65%|######4 | 72/111 [00:46<00:26, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9485, LAS: 0.9056, UEM: 0.5534, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6119, partial_loss/deprel_loss: 0.5648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.6804, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 68%|######7 | 75/111 [00:48<00:25, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9488, LAS: 0.9060, UEM: 0.5591, LEM: 0.3222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2361, partial_loss/deprel_loss: 0.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4519, loss: 0.6775, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 70%|####### | 78/111 [00:51<00:25, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9494, LAS: 0.9067, UEM: 0.5780, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0818, partial_loss/deprel_loss: 0.2043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3515, loss: 0.6721, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 73%|#######2 | 81/111 [00:53<00:22, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9490, LAS: 0.9061, UEM: 0.5733, LEM: 0.3404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9083, partial_loss/deprel_loss: 0.6554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8776, loss: 0.6770, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||: 77%|#######6 | 85/111 [00:56<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9488, LAS: 0.9059, UEM: 0.5730, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1963, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4591, loss: 0.6784, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||: 80%|######## | 89/111 [00:58<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9493, LAS: 0.9065, UEM: 0.5893, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0396, partial_loss/deprel_loss: 0.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2704, loss: 0.6757, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||: 83%|########2 | 92/111 [01:01<00:14, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9494, LAS: 0.9066, UEM: 0.5906, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 0.7517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9500, loss: 0.6758, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 86%|########5 | 95/111 [01:03<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9497, LAS: 0.9070, UEM: 0.5945, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6637, partial_loss/deprel_loss: 0.6962, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8613, loss: 0.6744, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 88%|########8 | 98/111 [01:05<00:09, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9495, LAS: 0.9067, UEM: 0.5956, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2025, partial_loss/deprel_loss: 0.8264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0732, loss: 0.6749, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 92%|#########1| 102/111 [01:08<00:06, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9498, LAS: 0.9069, UEM: 0.5952, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6735, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 95%|#########4| 105/111 [01:10<00:04, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9498, LAS: 0.9069, UEM: 0.5966, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5502, loss: 0.6728, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 98%|#########8| 109/111 [01:13<00:01, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9500, LAS: 0.9070, UEM: 0.6010, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0986, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4373, loss: 0.6715, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 00:44:46,230 - INFO - 
combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.307 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.099 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | N/A\n", + "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - UEM | 0.601 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LAS | 0.907 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - loss | 0.671 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEM | 0.370 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:44:46,232 - INFO - 
combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - EM | 0.935 | N/A\n", + "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:44:46,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Epoch duration: 0:01:23.490118\n", + "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Estimated training time remaining: 7:06:28\n", + "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Epoch 85/399\n", + "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:44:52,275 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:44:52,284 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9489, LAS: 0.9040, UEM: 0.4945, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4882, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7388, loss: 0.6966, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 4%|3 | 4/111 [00:02<00:59, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9493, LAS: 0.9031, UEM: 0.4720, LEM: 0.2297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8859, loss: 0.7048, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 7%|7 | 8/111 [00:04<00:59, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9508, LAS: 0.9050, UEM: 0.5020, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5759, partial_loss/deprel_loss: 0.5518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7282, loss: 0.6806, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 10%|9 | 11/111 [00:07<01:03, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9533, LAS: 0.9086, UEM: 0.5372, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.6507, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 14%|#3 | 15/111 [00:09<01:01, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9512, LAS: 0.9070, UEM: 0.5409, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.6631, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 16%|#6 | 18/111 [00:12<01:05, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9511, LAS: 0.9074, UEM: 0.5449, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2308, partial_loss/deprel_loss: 0.3370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.6610, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 19%|#8 | 21/111 [00:14<01:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9543, LAS: 0.9116, UEM: 0.6365, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2214, partial_loss/deprel_loss: 0.4003, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.6342, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 22%|##1 | 24/111 [00:16<01:03, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9527, LAS: 0.9099, UEM: 0.6114, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3740, partial_loss/deprel_loss: 0.4229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6472, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||: 25%|##5 | 28/111 [00:19<00:58, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9535, LAS: 0.9106, UEM: 0.6154, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4861, loss: 0.6429, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 28%|##7 | 31/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9547, LAS: 0.9122, UEM: 0.6263, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3075, partial_loss/deprel_loss: 0.4177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6327, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 31%|### | 34/111 [00:23<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9544, LAS: 0.9119, UEM: 0.6212, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7864, loss: 0.6345, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 34%|###4 | 38/111 [00:25<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9535, LAS: 0.9111, UEM: 0.6093, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6099, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.6401, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 37%|###6 | 41/111 [00:27<00:47, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9540, LAS: 0.9116, UEM: 0.6067, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.6379, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 41%|#### | 45/111 [00:30<00:43, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9532, LAS: 0.9111, UEM: 0.5997, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 0.6122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8159, loss: 0.6409, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 44%|####4 | 49/111 [00:32<00:40, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9513, LAS: 0.9092, UEM: 0.5832, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6072, partial_loss/deprel_loss: 0.5884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6533, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 48%|####7 | 53/111 [00:35<00:39, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9512, LAS: 0.9091, UEM: 0.5850, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6603, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.8126, loss: 0.6534, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||: 50%|##### | 56/111 [00:38<00:38, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9517, LAS: 0.9096, UEM: 0.5943, LEM: 0.3615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1501, partial_loss/deprel_loss: 0.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.6495, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 54%|#####4 | 60/111 [00:40<00:34, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9500, LAS: 0.9079, UEM: 0.5866, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6772, loss: 0.6611, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 58%|#####7 | 64/111 [00:43<00:31, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9503, LAS: 0.9082, UEM: 0.5875, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6555, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.6617, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 61%|######1 | 68/111 [00:46<00:30, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9508, LAS: 0.9088, UEM: 0.5997, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6568, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 64%|######3 | 71/111 [00:48<00:28, 1.39it/s]\n", + "UPOS_ACC: 0.0000, 
XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9502, LAS: 0.9081, UEM: 0.5917, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7786, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8527, loss: 0.6633, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 67%|######6 | 74/111 [00:50<00:26, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9503, LAS: 0.9081, UEM: 0.5887, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5200, partial_loss/deprel_loss: 0.5049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.6635, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 69%|######9 | 77/111 [00:52<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9494, LAS: 0.9071, UEM: 0.5841, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.6703, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 72%|#######2 | 80/111 [00:54<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9502, LAS: 0.9081, UEM: 0.6033, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.6625, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 75%|#######4 | 83/111 [00:57<00:20, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9505, LAS: 0.9084, UEM: 0.6038, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2464, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6609, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 77%|#######7 | 86/111 [00:59<00:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9498, LAS: 0.9076, UEM: 0.5981, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9836, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9079, loss: 0.6671, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 81%|########1 | 90/111 [01:01<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9492, LAS: 0.9069, UEM: 0.5945, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7101, partial_loss/deprel_loss: 0.6880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8639, loss: 0.6734, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 85%|########4 | 94/111 [01:04<00:11, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8769, UAS: 0.9493, LAS: 0.9069, UEM: 0.5976, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9722, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9228, loss: 0.6741, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 87%|########7 | 97/111 [01:06<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9496, LAS: 0.9071, UEM: 0.5950, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7420, partial_loss/deprel_loss: 0.7137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.6729, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||: 92%|#########1| 102/111 [01:08<00:05, 1.62it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9499, LAS: 0.9075, UEM: 0.5979, LEM: 0.3685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6889, loss: 0.6693, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||: 96%|#########6| 107/111 [01:11<00:02, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9504, LAS: 0.9079, UEM: 0.6026, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2185, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5080, loss: 0.6663, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:13<00:00, 1.52it/s]\n", + "2023-04-07 00:46:08,660 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9122, LAS: 0.8613, UEM: 0.3719, LEM: 0.1357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6872, partial_loss/deprel_loss: 33.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 27.1136, loss: 36.1110, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.03s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9236, LAS: 0.8697, UEM: 0.3147, LEM: 0.0932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 47.1769, partial_loss/cycle_loss: 0.0000, batch_loss: 38.0038, loss: 32.5457, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:08, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, 
UAS: 0.9373, LAS: 0.8872, UEM: 0.6018, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1716, partial_loss/deprel_loss: 19.2356, partial_loss/cycle_loss: 0.0000, batch_loss: 15.4228, loss: 28.2524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:05, 1.00s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9431, LAS: 0.8932, UEM: 0.6361, LEM: 0.3959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 23.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5378, loss: 26.2134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 
00:46:21,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.366 | 25.873\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.218 | 0.395\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - reg_loss | 0.172 | 0.000\n", + "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - UEM | 0.603 | 0.647\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LAS | 0.908 | 0.896\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - loss | 0.666 | 25.248\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEM | 0.371 | 0.386\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | 0.946\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EM | 0.927 | 0.916\n", + "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - 
worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:46:21,318 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Epoch duration: 0:01:33.977591\n", + "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Estimated training time remaining: 7:05:54\n", + "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Epoch 86/399\n", + "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:46:26,253 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:46:26,259 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9549, LAS: 0.9143, UEM: 0.5126, LEM: 0.2644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.5818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7569, loss: 0.6319, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 4%|3 | 4/111 [00:02<01:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9574, LAS: 0.9172, UEM: 0.5572, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5092, loss: 0.6052, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 6%|6 | 7/111 [00:04<01:09, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9556, LAS: 0.9147, UEM: 0.5295, LEM: 0.2703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, 
partial_loss/deprel_loss: 0.4638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.6292, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 9%|9 | 10/111 [00:06<01:08, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9560, LAS: 0.9151, UEM: 0.5308, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4331, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 0.6216, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 12%|#1 | 13/111 [00:08<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9553, LAS: 0.9142, UEM: 0.5352, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.4334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.6263, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 15%|#5 | 17/111 [00:11<01:03, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9548, LAS: 0.9133, UEM: 0.5388, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2227, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.6341, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 18%|#8 | 20/111 [00:13<01:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9508, LAS: 0.9089, UEM: 0.5216, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 22%|##1 | 24/111 [00:15<00:56, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9503, LAS: 0.9078, UEM: 0.5263, LEM: 0.2784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1759, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6687, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 24%|##4 | 27/111 [00:18<00:58, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9507, LAS: 0.9085, UEM: 0.5438, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.6630, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 28%|##7 | 31/111 [00:20<00:53, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9506, LAS: 0.9088, UEM: 0.5685, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7128, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 31%|### | 34/111 [00:22<00:52, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9505, LAS: 0.9085, UEM: 0.5655, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2677, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 34%|###4 | 38/111 [00:25<00:49, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9513, LAS: 0.9093, UEM: 0.5822, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.2598, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4080, loss: 0.6536, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 37%|###6 | 41/111 [00:27<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9521, LAS: 0.9097, UEM: 0.5914, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.4478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6479, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 40%|###9 | 44/111 [00:30<00:48, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9506, LAS: 0.9082, UEM: 0.5772, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0487, partial_loss/deprel_loss: 0.7064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9462, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||: 42%|####2 | 47/111 [00:32<00:45, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9518, LAS: 0.9095, UEM: 0.5924, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.6508, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 46%|####5 | 51/111 [00:34<00:42, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9527, LAS: 0.9100, UEM: 0.5966, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2301, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.6473, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 50%|####9 | 55/111 [00:37<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9522, LAS: 0.9094, UEM: 0.6012, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1176, partial_loss/deprel_loss: 0.3189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.6513, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 53%|#####3 | 59/111 [00:40<00:35, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9524, LAS: 0.9098, UEM: 0.5956, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4422, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 0.6495, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 57%|#####6 | 63/111 [00:42<00:31, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9516, LAS: 0.9088, UEM: 0.5877, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3114, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6568, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 60%|###### | 67/111 [00:44<00:27, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9507, LAS: 0.9080, UEM: 0.5830, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.6379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.6621, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 65%|######4 | 72/111 [00:47<00:22, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9501, LAS: 0.9074, UEM: 0.5871, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 0.8042, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0473, loss: 0.6673, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 69%|######9 | 77/111 [00:49<00:18, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9510, LAS: 0.9086, UEM: 0.6098, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2064, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4838, loss: 0.6614, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 73%|#######2 | 81/111 [00:51<00:16, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9511, LAS: 0.9085, UEM: 0.6124, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3728, partial_loss/deprel_loss: 0.4867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6352, loss: 0.6604, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 77%|#######6 | 85/111 [00:55<00:16, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9501, LAS: 0.9075, UEM: 0.6048, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8220, loss: 0.6699, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 80%|######## | 89/111 [00:58<00:14, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9502, LAS: 0.9077, UEM: 0.6015, LEM: 0.3738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4820, loss: 0.6682, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 84%|########3 | 93/111 [01:00<00:12, 
1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9506, LAS: 0.9082, UEM: 0.6050, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2539, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.6638, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 87%|########7 | 97/111 [01:03<00:09, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9503, LAS: 0.9078, UEM: 0.5996, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.6678, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||: 90%|######### | 100/111 [01:05<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9505, LAS: 0.9079, UEM: 0.6015, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6447, partial_loss/deprel_loss: 0.5784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.6663, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 94%|#########3| 104/111 [01:08<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9501, LAS: 0.9076, UEM: 0.5952, LEM: 0.3664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7687, loss: 0.6689, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 97%|#########7| 108/111 [01:10<00:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9503, LAS: 0.9078, UEM: 0.6002, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5065, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.6659, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 00:47:43,046 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.534 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.506 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UEM | 0.600 | N/A\n", + "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - LAS | 0.908 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - loss | 0.666 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - LEM | 0.371 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - 
combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EM | 0.902 | N/A\n", + "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:47:43,053 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:47:49,210 - INFO - combo.training.trainer - Epoch duration: 0:01:22.957862\n", + "2023-04-07 00:47:49,211 - INFO - combo.training.trainer - Estimated training time remaining: 7:04:38\n", + "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Epoch 87/399\n", + "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:47:49,212 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:47:49,221 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9687, LAS: 0.9283, UEM: 0.6917, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.5496, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9621, LAS: 0.9222, UEM: 0.7021, LEM: 0.4715, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1045, partial_loss/deprel_loss: 0.2157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3647, loss: 0.5783, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 5%|5 | 6/111 [00:04<01:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9557, LAS: 0.9144, UEM: 0.6255, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5098, loss: 0.6403, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 9%|9 | 10/111 [00:07<01:11, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9478, LAS: 0.9059, UEM: 0.5568, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8828, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8597, loss: 0.6974, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 13%|#2 | 14/111 [00:09<01:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9500, LAS: 0.9077, UEM: 0.5914, LEM: 0.3698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1040, partial_loss/deprel_loss: 0.3227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4502, loss: 0.6824, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 15%|#5 | 17/111 [00:11<01:06, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9514, LAS: 0.9091, UEM: 0.6130, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1171, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4015, loss: 0.6680, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 18%|#8 | 20/111 [00:14<01:04, 
1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9511, LAS: 0.9090, UEM: 0.5950, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7511, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.6676, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||: 21%|## | 23/111 [00:16<01:01, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9521, LAS: 0.9100, UEM: 0.5844, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4836, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6586, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||: 24%|##4 | 27/111 [00:18<00:55, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9511, LAS: 0.9096, UEM: 0.5885, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5662, loss: 0.6604, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||: 28%|##7 | 31/111 [00:21<00:52, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9496, LAS: 0.9082, UEM: 0.5715, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8570, loss: 0.6712, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||: 32%|###1 | 35/111 [00:23<00:49, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9515, LAS: 0.9106, UEM: 0.5987, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4673, loss: 0.6518, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 35%|###5 | 39/111 [00:27<00:51, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9506, LAS: 0.9096, UEM: 0.5906, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2880, partial_loss/deprel_loss: 0.8245, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0884, loss: 0.6588, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 38%|###7 | 42/111 [00:29<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9517, LAS: 0.9103, UEM: 0.6028, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5693, loss: 0.6515, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 41%|####1 | 46/111 [00:31<00:42, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9519, LAS: 0.9103, UEM: 0.5993, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7766, partial_loss/deprel_loss: 0.5683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7812, loss: 0.6519, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 46%|####5 | 51/111 [00:33<00:36, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9516, LAS: 0.9102, UEM: 0.6066, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.6525, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 50%|####9 | 55/111 [00:36<00:35, 1.60it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9505, LAS: 0.9089, UEM: 0.5934, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0241, partial_loss/deprel_loss: 0.7608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9846, loss: 0.6616, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 53%|#####3 | 59/111 [00:38<00:31, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9507, LAS: 0.9092, UEM: 0.6009, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6563, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 57%|#####6 | 63/111 [00:41<00:29, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9497, LAS: 0.9081, UEM: 0.5987, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.3651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6632, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 60%|###### | 67/111 [00:43<00:27, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9490, LAS: 0.9072, UEM: 0.5947, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4450, partial_loss/deprel_loss: 0.8776, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1623, loss: 0.6706, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 65%|######4 | 72/111 [00:46<00:23, 1.69it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9487, LAS: 0.9068, UEM: 0.5909, LEM: 
0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.6724, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 69%|######9 | 77/111 [00:48<00:18, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9488, LAS: 0.9069, UEM: 0.5854, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3230, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.6719, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 73%|#######2 | 81/111 [00:51<00:17, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9492, LAS: 0.9074, UEM: 0.6009, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8553, loss: 0.6688, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 77%|#######6 | 85/111 [00:54<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9496, LAS: 0.9078, UEM: 0.6041, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.6651, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||: 80%|######## | 89/111 [00:57<00:14, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9493, LAS: 0.9073, UEM: 0.5980, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4866, partial_loss/deprel_loss: 0.4848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.6681, batch_reg_loss: 0.1711, 
reg_loss: 0.1712 ||: 84%|########3 | 93/111 [01:00<00:12, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9491, LAS: 0.9071, UEM: 0.5911, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3899, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6705, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 87%|########7 | 97/111 [01:03<00:10, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9496, LAS: 0.9077, UEM: 0.5966, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5616, loss: 0.6659, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 91%|######### | 101/111 [01:05<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9502, LAS: 0.9085, UEM: 0.6076, LEM: 0.3781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5397, loss: 0.6596, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 95%|#########4| 105/111 [01:08<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9502, LAS: 0.9084, UEM: 0.6053, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5986, loss: 0.6600, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 98%|#########8| 109/111 [01:11<00:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9501, LAS: 0.9082, UEM: 
0.6015, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7131, partial_loss/deprel_loss: 0.6420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.6628, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.642 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.713 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UEM | 0.601 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LAS | 0.908 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - loss | 0.663 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEM | 
0.372 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EM | 0.893 | N/A\n", + "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:49:05,048 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Epoch duration: 0:01:20.806982\n", + "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:03:15\n", + "2023-04-07 00:49:10,018 - INFO - allennlp.training.trainer - Epoch 88/399\n", + "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:49:10,028 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9648, LAS: 0.9244, UEM: 0.6771, LEM: 0.4049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3842, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6010, loss: 0.5365, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 4%|3 | 4/111 [00:02<01:08, 1.56it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9613, LAS: 0.9201, 
UEM: 0.6885, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1407, partial_loss/deprel_loss: 0.2453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5656, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 6%|6 | 7/111 [00:04<01:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9565, LAS: 0.9148, UEM: 0.6298, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8094, partial_loss/deprel_loss: 0.6079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8192, loss: 0.6131, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 10%|9 | 11/111 [00:07<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9537, LAS: 0.9116, UEM: 0.6465, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4722, partial_loss/deprel_loss: 0.4675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.6314, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 13%|#2 | 14/111 [00:09<01:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9516, LAS: 0.9094, UEM: 0.6364, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2188, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.6542, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 16%|#6 | 18/111 [00:12<01:01, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9494, LAS: 0.9073, UEM: 0.6218, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7928, loss: 0.6670, batch_reg_loss: 0.1711, 
reg_loss: 0.1711 ||: 20%|#9 | 22/111 [00:14<00:58, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9493, LAS: 0.9074, UEM: 0.6181, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7434, loss: 0.6665, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 23%|##2 | 25/111 [00:16<00:58, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9479, LAS: 0.9056, UEM: 0.5939, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5422, partial_loss/deprel_loss: 0.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6942, loss: 0.6767, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 25%|##5 | 28/111 [00:19<00:57, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9484, LAS: 0.9059, UEM: 0.6016, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1821, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4843, loss: 0.6760, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 28%|##7 | 31/111 [00:21<01:00, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9486, LAS: 0.9059, UEM: 0.5937, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7760, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.6750, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 32%|###1 | 35/111 [00:24<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9470, LAS: 0.9040, UEM: 0.5709, LEM: 0.3493, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6367, partial_loss/deprel_loss: 0.6364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8075, loss: 0.6898, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 35%|###5 | 39/111 [00:26<00:49, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9056, UEM: 0.5839, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.6773, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 39%|###8 | 43/111 [00:29<00:47, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9492, LAS: 0.9066, UEM: 0.5935, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 0.3325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6670, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||: 42%|####2 | 47/111 [00:31<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9481, LAS: 0.9053, UEM: 0.5892, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.6769, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 47%|####6 | 52/111 [00:34<00:35, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9481, LAS: 0.9055, UEM: 0.5862, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5692, loss: 0.6759, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 
51%|#####1 | 57/111 [00:36<00:30, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9497, LAS: 0.9070, UEM: 0.5991, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1718, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6644, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 56%|#####5 | 62/111 [00:38<00:25, 1.92it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9489, LAS: 0.9063, UEM: 0.5947, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5362, loss: 0.6699, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 59%|#####9 | 66/111 [00:41<00:25, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9494, LAS: 0.9067, UEM: 0.5983, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1346, partial_loss/deprel_loss: 0.2575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.6678, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 63%|######3 | 70/111 [00:43<00:23, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9503, LAS: 0.9076, UEM: 0.6103, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.6601, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 67%|######6 | 74/111 [00:46<00:23, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9505, LAS: 0.9081, UEM: 0.6227, LEM: 0.3947, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7462, loss: 0.6569, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 70%|####### | 78/111 [00:50<00:22, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9508, LAS: 0.9084, UEM: 0.6206, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6562, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 74%|#######3 | 82/111 [00:52<00:20, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9510, LAS: 0.9085, UEM: 0.6165, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3369, partial_loss/deprel_loss: 0.5227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6566, loss: 0.6572, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||: 77%|#######6 | 85/111 [00:55<00:18, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9511, LAS: 0.9085, UEM: 0.6129, LEM: 0.3792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5236, partial_loss/deprel_loss: 0.5315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7009, loss: 0.6570, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 79%|#######9 | 88/111 [00:57<00:16, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9504, LAS: 0.9078, UEM: 0.6034, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6980, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.8108, loss: 0.6609, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 83%|########2 | 92/111 [00:59<00:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9509, LAS: 0.9082, UEM: 0.6093, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3124, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 0.6571, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 86%|########5 | 95/111 [01:02<00:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9513, LAS: 0.9088, UEM: 0.6183, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.6536, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 88%|########8 | 98/111 [01:04<00:09, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9511, LAS: 0.9085, UEM: 0.6137, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8182, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9121, loss: 0.6563, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 92%|#########1| 102/111 [01:07<00:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9506, LAS: 0.9079, UEM: 0.6094, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6152, partial_loss/deprel_loss: 0.6973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8518, loss: 0.6612, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 95%|#########5| 106/111 [01:09<00:03, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9504, LAS: 0.9075, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8294, partial_loss/deprel_loss: 0.6723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8747, loss: 0.6649, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 99%|#########9| 110/111 [01:11<00:00, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9503, LAS: 0.9075, UEM: 0.6013, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7436, loss: 0.6656, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.571 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.580 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - 
combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UEM | 0.601 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LAS | 0.907 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - loss | 0.666 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEM | 0.372 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UAS | 0.950 | N/A\n", + "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - EM | 0.903 | N/A\n", + "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:50:25,584 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:50:30,371 - INFO - combo.training.trainer - Epoch duration: 0:01:20.352845\n", + "2023-04-07 00:50:30,372 - INFO - combo.training.trainer - Estimated training time remaining: 7:01:50\n", + "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Epoch 89/399\n", + "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:50:30,373 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:50:30,382 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9624, LAS: 0.9199, UEM: 0.6179, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.4097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.5893, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 3%|2 | 3/111 [00:02<01:13, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9575, LAS: 0.9151, UEM: 0.6054, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4951, partial_loss/deprel_loss: 0.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6034, batch_reg_loss: 0.1709, reg_loss: 0.1710 ||: 5%|5 | 6/111 [00:04<01:11, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9608, LAS: 0.9188, UEM: 0.6575, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2058, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.5747, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 8%|8 | 9/111 
[00:06<01:13, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9648, UAS: 0.9584, LAS: 0.9174, UEM: 0.7075, LEM: 0.4978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0484, partial_loss/deprel_loss: 0.1350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2886, loss: 0.5920, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 12%|#1 | 13/111 [00:09<01:12, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9516, LAS: 0.9103, UEM: 0.6846, LEM: 0.4747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5908, partial_loss/deprel_loss: 0.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2522, loss: 0.6493, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 14%|#4 | 16/111 [00:14<01:31, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9528, LAS: 0.9117, UEM: 0.6715, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.6407, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 18%|#8 | 20/111 [00:16<01:18, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9546, LAS: 0.9136, UEM: 0.6846, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6282, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 21%|## | 23/111 [00:18<01:10, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9526, LAS: 0.9115, UEM: 0.6587, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6559, partial_loss/deprel_loss: 0.6576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.6451, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 24%|##4 | 27/111 [00:20<01:00, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9520, LAS: 0.9108, UEM: 0.6580, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.6525, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 29%|##8 | 32/111 [00:23<00:52, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9523, LAS: 0.9115, UEM: 0.6451, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2655, partial_loss/deprel_loss: 0.3666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6465, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 33%|###3 | 37/111 [00:25<00:44, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9529, LAS: 0.9117, UEM: 0.6360, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3649, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5989, loss: 0.6419, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 38%|###7 | 42/111 [00:27<00:37, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9533, LAS: 0.9119, UEM: 0.6308, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6191, loss: 0.6401, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 41%|####1 | 46/111 [00:30<00:37, 1.72it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9530, LAS: 0.9112, UEM: 0.6381, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4505, partial_loss/deprel_loss: 0.6057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.6447, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 45%|####5 | 50/111 [00:33<00:36, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9541, LAS: 0.9121, UEM: 0.6467, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.4205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.6382, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 49%|####8 | 54/111 [00:35<00:35, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9531, LAS: 0.9111, UEM: 0.6393, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7622, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.6446, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 52%|#####2 | 58/111 [00:38<00:33, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9534, LAS: 0.9116, UEM: 0.6483, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.5976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8129, loss: 0.6389, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 56%|#####5 | 62/111 [00:41<00:32, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9523, LAS: 0.9106, UEM: 0.6397, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7800, partial_loss/deprel_loss: 0.5918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.6471, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 59%|#####9 | 66/111 [00:44<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9529, LAS: 0.9111, UEM: 0.6421, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.6425, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 63%|######3 | 70/111 [00:46<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9534, LAS: 0.9117, UEM: 0.6431, LEM: 0.4159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2698, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.6379, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||: 66%|######5 | 73/111 [00:49<00:26, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9525, LAS: 0.9106, UEM: 0.6362, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3974, partial_loss/deprel_loss: 0.8038, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0934, loss: 0.6450, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 68%|######8 | 76/111 [00:51<00:24, 1.46it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9526, LAS: 0.9106, UEM: 0.6360, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.6453, batch_reg_loss: 
0.1708, reg_loss: 0.1709 ||: 71%|#######1 | 79/111 [00:53<00:22, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9524, LAS: 0.9105, UEM: 0.6310, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3757, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6165, loss: 0.6464, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 75%|#######4 | 83/111 [00:55<00:18, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9519, LAS: 0.9099, UEM: 0.6210, LEM: 0.3966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6011, partial_loss/deprel_loss: 0.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.6522, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 78%|#######8 | 87/111 [00:58<00:15, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9520, LAS: 0.9102, UEM: 0.6168, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4617, loss: 0.6498, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 82%|########1 | 91/111 [01:00<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9522, LAS: 0.9103, UEM: 0.6161, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.4240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.6488, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 85%|########4 | 94/111 [01:02<00:11, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9523, LAS: 0.9104, 
UEM: 0.6158, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2154, partial_loss/deprel_loss: 0.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6470, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 87%|########7 | 97/111 [01:05<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9526, LAS: 0.9105, UEM: 0.6182, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6561, loss: 0.6454, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 91%|######### | 101/111 [01:07<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9519, LAS: 0.9096, UEM: 0.6129, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.6513, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 94%|#########3| 104/111 [01:09<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9515, LAS: 0.9093, UEM: 0.6072, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6124, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7494, loss: 0.6536, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 97%|#########7| 108/111 [01:12<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 
0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 00:51:48,085 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.515 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.425 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UEM | 0.605 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LAS | 0.909 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - 
combo.training.tensorboard_writer - loss | 0.654 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LEM | 0.377 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - UAS | 0.951 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EM | 0.909 | N/A\n", + "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:51:48,092 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Epoch duration: 0:01:23.555709\n", + "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Estimated training time remaining: 7:00:36\n", + "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Epoch 90/399\n", + "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:51:53,929 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:51:53,937 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9586, LAS: 0.9155, UEM: 0.5270, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4390, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6394, loss: 0.6227, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 4%|3 | 4/111 [00:02<01:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9620, LAS: 0.9203, UEM: 0.6100, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3636, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.5838, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 6%|6 | 7/111 [00:05<01:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9583, LAS: 0.9171, UEM: 0.6267, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8749, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8585, loss: 0.6021, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 10%|9 | 11/111 [00:07<01:05, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9531, LAS: 0.9121, UEM: 0.5706, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9044, partial_loss/deprel_loss: 0.6860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9005, loss: 0.6420, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 14%|#4 | 16/111 [00:09<00:56, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9505, LAS: 0.9098, UEM: 0.5415, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0960, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9841, loss: 0.6564, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 19%|#8 | 21/111 [00:11<00:50, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9539, LAS: 
0.9130, UEM: 0.6156, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3574, loss: 0.6258, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 23%|##3 | 26/111 [00:14<00:48, 1.77it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9558, LAS: 0.9152, UEM: 0.6321, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6117, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 27%|##7 | 30/111 [00:17<00:47, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9541, LAS: 0.9137, UEM: 0.6241, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0644, partial_loss/deprel_loss: 0.7645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9952, loss: 0.6239, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 31%|### | 34/111 [00:20<00:48, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9553, LAS: 0.9151, UEM: 0.6368, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2827, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.6155, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||: 34%|###4 | 38/111 [00:22<00:44, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9557, LAS: 0.9154, UEM: 0.6404, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1780, partial_loss/deprel_loss: 0.3391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.6130, batch_reg_loss: 
0.1707, reg_loss: 0.1708 ||: 38%|###7 | 42/111 [00:25<00:44, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9546, LAS: 0.9140, UEM: 0.6388, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9500, partial_loss/deprel_loss: 0.6070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.6205, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 41%|####1 | 46/111 [00:28<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9547, LAS: 0.9141, UEM: 0.6337, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3840, partial_loss/deprel_loss: 0.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6183, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 45%|####5 | 50/111 [00:30<00:39, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9541, LAS: 0.9134, UEM: 0.6280, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6211, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 49%|####8 | 54/111 [00:33<00:37, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9543, LAS: 0.9132, UEM: 0.6260, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6095, loss: 0.6207, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 52%|#####2 | 58/111 [00:36<00:36, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9543, LAS: 0.9130, UEM: 0.6279, LEM: 
0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2470, partial_loss/deprel_loss: 0.3760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.6219, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 55%|#####4 | 61/111 [00:38<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9539, LAS: 0.9125, UEM: 0.6219, LEM: 0.3795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5638, partial_loss/deprel_loss: 0.5155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.6253, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 59%|#####8 | 65/111 [00:41<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9537, LAS: 0.9121, UEM: 0.6204, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8245, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8897, loss: 0.6278, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 61%|######1 | 68/111 [00:43<00:29, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9538, LAS: 0.9124, UEM: 0.6296, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0910, partial_loss/deprel_loss: 0.2150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3609, loss: 0.6257, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||: 64%|######3 | 71/111 [00:45<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9534, LAS: 0.9119, UEM: 0.6202, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3472, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6306, batch_reg_loss: 0.1707, 
reg_loss: 0.1707 ||: 68%|######7 | 75/111 [00:48<00:25, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9531, LAS: 0.9114, UEM: 0.6143, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8013, partial_loss/deprel_loss: 0.6878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8812, loss: 0.6355, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 70%|####### | 78/111 [00:50<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9531, LAS: 0.9113, UEM: 0.6071, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5766, partial_loss/deprel_loss: 0.6206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7825, loss: 0.6377, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 74%|#######3 | 82/111 [00:53<00:19, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9525, LAS: 0.9106, UEM: 0.6012, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4863, partial_loss/deprel_loss: 0.5547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.6427, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 77%|#######6 | 85/111 [00:55<00:17, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9518, LAS: 0.9098, UEM: 0.5942, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7252, partial_loss/deprel_loss: 0.6054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6498, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 79%|#######9 | 88/111 [00:57<00:15, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9520, LAS: 0.9100, UEM: 0.5902, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6494, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 83%|########2 | 92/111 [00:59<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9525, LAS: 0.9105, UEM: 0.5960, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1836, partial_loss/deprel_loss: 0.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6452, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 86%|########5 | 95/111 [01:02<00:11, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9515, LAS: 0.9095, UEM: 0.5901, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6474, partial_loss/deprel_loss: 0.6101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7882, loss: 0.6541, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 89%|########9 | 99/111 [01:04<00:08, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9516, LAS: 0.9096, UEM: 0.5925, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.6533, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 92%|#########1| 102/111 [01:07<00:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9509, LAS: 0.9089, UEM: 0.5867, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5455, partial_loss/deprel_loss: 0.5296, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.6580, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 95%|#########4| 105/111 [01:09<00:04, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9513, LAS: 0.9093, UEM: 0.5920, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5731, loss: 0.6548, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 97%|#########7| 108/111 [01:11<00:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-07 00:53:10,727 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9666, LAS: 0.9178, UEM: 0.7733, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4139, partial_loss/deprel_loss: 25.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 20.6140, loss: 19.3419, batch_reg_loss: 0.0000, 
reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9579, LAS: 0.9100, UEM: 0.7512, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9262, partial_loss/deprel_loss: 35.7394, partial_loss/cycle_loss: 0.0000, batch_loss: 28.7767, loss: 21.8718, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:05<00:04, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9531, LAS: 0.9020, UEM: 0.6854, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7791, partial_loss/deprel_loss: 28.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3162, loss: 23.2931, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:07<00:01, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9464, LAS: 0.8943, UEM: 0.6498, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7166, partial_loss/deprel_loss: 55.2239, partial_loss/cycle_loss: 0.0000, batch_loss: 44.5224, loss: 25.0047, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:09<00:00, 1.39it/s]\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELAS | 
0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.569 | 55.224\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.614 | 1.717\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | 0.000\n", + "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UEM | 0.603 | 0.650\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LAS | 0.910 | 0.894\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - loss | 0.654 | 25.005\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEM | 0.372 | 0.386\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - UAS | 0.951 | 0.946\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EM | 0.904 | 0.829\n", + "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:53:20,063 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Epoch duration: 0:01:30.925328\n", + "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Estimated training time remaining: 6:59:47\n", + "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Epoch 91/399\n", + "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:53:24,855 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:53:24,864 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9196, LAS: 0.8740, UEM: 0.1556, LEM: 0.0356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5877, partial_loss/deprel_loss: 0.9074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2141, loss: 0.9081, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 3%|2 | 3/111 [00:02<01:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9417, LAS: 0.9000, UEM: 0.5139, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5749, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.7202, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 6%|6 | 7/111 [00:04<01:12, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9332, LAS: 0.8911, UEM: 0.4231, LEM: 0.2178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9388, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9358, loss: 0.7898, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 10%|9 | 11/111 [00:07<01:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9391, LAS: 0.8975, UEM: 0.5123, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.6334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8161, loss: 0.7382, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 14%|#3 | 15/111 [00:09<01:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9411, LAS: 0.8992, UEM: 0.4980, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.3629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.7306, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 16%|#6 | 18/111 [00:11<01:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9448, LAS: 0.9035, UEM: 0.5821, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4230, loss: 0.6973, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 19%|#8 | 21/111 [00:14<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9467, LAS: 0.9060, UEM: 0.5947, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1693, partial_loss/deprel_loss: 0.2629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.6790, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 22%|##1 | 24/111 [00:16<01:03, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9484, LAS: 0.9081, UEM: 0.5871, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2777, partial_loss/deprel_loss: 
0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.6673, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 25%|##5 | 28/111 [00:18<00:57, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9507, LAS: 0.9106, UEM: 0.6326, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3565, partial_loss/deprel_loss: 0.4421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5957, loss: 0.6473, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 28%|##7 | 31/111 [00:21<00:58, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9501, LAS: 0.9099, UEM: 0.6233, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1390, partial_loss/deprel_loss: 0.7462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.6526, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 32%|###1 | 35/111 [00:23<00:53, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9501, LAS: 0.9099, UEM: 0.6146, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7562, partial_loss/deprel_loss: 0.6199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 34%|###4 | 38/111 [00:26<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9507, LAS: 0.9103, UEM: 0.6202, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0333, partial_loss/deprel_loss: 0.7240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9565, loss: 0.6498, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 38%|###7 | 42/111 [00:28<00:47, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9501, LAS: 0.9096, UEM: 0.6078, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0019, partial_loss/deprel_loss: 0.5839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8381, loss: 0.6546, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 41%|####1 | 46/111 [00:31<00:42, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9508, LAS: 0.9102, UEM: 0.6114, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2693, partial_loss/deprel_loss: 0.4158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.6488, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 45%|####5 | 50/111 [00:33<00:40, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9505, LAS: 0.9100, UEM: 0.6099, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5179, loss: 0.6507, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 49%|####8 | 54/111 [00:36<00:38, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9514, LAS: 0.9109, UEM: 0.6192, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3527, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.6443, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||: 52%|#####2 | 58/111 [00:39<00:36, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9515, LAS: 0.9108, UEM: 0.6114, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6184, partial_loss/deprel_loss: 0.5387, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.7252, loss: 0.6485, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 56%|#####5 | 62/111 [00:42<00:33, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9513, LAS: 0.9104, UEM: 0.6053, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 59%|#####9 | 66/111 [00:44<00:30, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9512, LAS: 0.9098, UEM: 0.5997, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4839, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.6560, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 63%|######3 | 70/111 [00:47<00:28, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9520, LAS: 0.9109, UEM: 0.6199, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2920, loss: 0.6489, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 66%|######5 | 73/111 [00:49<00:27, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9522, LAS: 0.9109, UEM: 0.6165, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.6500, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 68%|######8 | 76/111 [00:52<00:25, 
1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9519, LAS: 0.9106, UEM: 0.6132, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7848, partial_loss/deprel_loss: 0.6318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8330, loss: 0.6508, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 71%|#######1 | 79/111 [00:54<00:23, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9523, LAS: 0.9111, UEM: 0.6146, LEM: 0.3882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2224, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6476, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 74%|#######3 | 82/111 [00:56<00:20, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9525, LAS: 0.9114, UEM: 0.6173, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7428, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7697, loss: 0.6460, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||: 77%|#######6 | 85/111 [00:58<00:19, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9521, LAS: 0.9110, UEM: 0.6158, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2247, partial_loss/deprel_loss: 0.3346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.6467, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 81%|########1 | 90/111 [01:01<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9520, LAS: 0.9106, UEM: 0.6101, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7335, loss: 0.6502, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 85%|########4 | 94/111 [01:03<00:10, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9528, LAS: 0.9115, UEM: 0.6231, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.6430, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 88%|########8 | 98/111 [01:06<00:08, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9529, LAS: 0.9116, UEM: 0.6202, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6575, partial_loss/deprel_loss: 0.6112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7910, loss: 0.6424, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 92%|#########1| 102/111 [01:08<00:05, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9525, LAS: 0.9110, UEM: 0.6148, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5890, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6965, loss: 0.6469, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 95%|#########5| 106/111 [01:11<00:03, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9521, LAS: 0.9106, UEM: 0.6092, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.7078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.6498, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 99%|#########9| 
110/111 [01:13<00:00, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9520, LAS: 0.9104, UEM: 0.6071, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8246, partial_loss/deprel_loss: 0.6674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8694, loss: 0.6518, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.667 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.825 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - reg_loss | 0.171 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UEM | 0.607 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LAS | 0.910 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - loss | 0.652 | N/A\n", + 
"2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEM | 0.378 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UAS | 0.952 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EM | 0.891 | N/A\n", + "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:54:41,921 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:54:46,283 - INFO - combo.training.trainer - Epoch duration: 0:01:21.429347\n", + "2023-04-07 00:54:46,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:58:25\n", + "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Epoch 92/399\n", + "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:54:46,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:54:46,293 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9542, LAS: 0.9139, UEM: 0.7424, LEM: 0.5818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5152, partial_loss/deprel_loss: 0.5199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.6134, batch_reg_loss: 0.1705, reg_loss: 
0.1705 ||: 3%|2 | 3/111 [00:02<01:21, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9479, LAS: 0.9073, UEM: 0.6124, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5882, loss: 0.6523, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 5%|5 | 6/111 [00:04<01:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9463, LAS: 0.9048, UEM: 0.6333, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4584, loss: 0.6718, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 9%|9 | 10/111 [00:06<01:11, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9422, LAS: 0.9000, UEM: 0.5906, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4059, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.7008, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 12%|#1 | 13/111 [00:09<01:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9447, LAS: 0.9030, UEM: 0.5856, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6912, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 15%|#5 | 17/111 [00:11<01:06, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9470, LAS: 0.9053, UEM: 0.5853, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 
0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2329, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.6773, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 19%|#8 | 21/111 [00:14<01:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9460, LAS: 0.9037, UEM: 0.5511, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.5975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.6872, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 23%|##2 | 25/111 [00:16<00:55, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9480, LAS: 0.9061, UEM: 0.5590, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.3937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.6726, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||: 26%|##6 | 29/111 [00:19<00:52, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9489, LAS: 0.9070, UEM: 0.5670, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.6676, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 29%|##8 | 32/111 [00:21<00:52, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9491, LAS: 0.9076, UEM: 0.5801, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1063, partial_loss/deprel_loss: 0.2096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3594, loss: 0.6631, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 32%|###1 | 35/111 [00:23<00:53, 
1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9488, LAS: 0.9072, UEM: 0.5672, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3363, partial_loss/deprel_loss: 0.4694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6132, loss: 0.6686, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 34%|###4 | 38/111 [00:25<00:52, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9494, LAS: 0.9079, UEM: 0.5780, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.6623, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 37%|###6 | 41/111 [00:28<00:51, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9505, LAS: 0.9092, UEM: 0.5912, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6529, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 40%|###9 | 44/111 [00:30<00:48, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9502, LAS: 0.9091, UEM: 0.5955, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2522, partial_loss/deprel_loss: 0.6656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9533, loss: 0.6536, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 42%|####2 | 47/111 [00:32<00:47, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9506, LAS: 0.9097, UEM: 0.5931, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6486, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 45%|####5 | 50/111 [00:35<00:47, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9503, LAS: 0.9092, UEM: 0.5891, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4746, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6548, loss: 0.6510, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 49%|####8 | 54/111 [00:37<00:40, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9506, LAS: 0.9095, UEM: 0.5857, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3050, partial_loss/deprel_loss: 0.3623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5212, loss: 0.6479, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||: 51%|#####1 | 57/111 [00:39<00:39, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9105, UEM: 0.5931, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.2933, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4419, loss: 0.6429, batch_reg_loss: 0.1704, reg_loss: 0.1704 ||: 55%|#####4 | 61/111 [00:42<00:35, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9504, LAS: 0.9094, UEM: 0.5806, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6265, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.6522, batch_reg_loss: 0.1703, 
reg_loss: 0.1704 ||: 59%|#####8 | 65/111 [00:44<00:31, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9501, LAS: 0.9092, UEM: 0.5760, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9519, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8500, loss: 0.6552, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 62%|######2 | 69/111 [00:47<00:27, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9514, LAS: 0.9108, UEM: 0.6083, LEM: 0.3858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4295, partial_loss/deprel_loss: 0.4640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 66%|######5 | 73/111 [00:50<00:26, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9524, LAS: 0.9119, UEM: 0.6201, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3675, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.6368, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 69%|######9 | 77/111 [00:53<00:23, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9531, LAS: 0.9123, UEM: 0.6260, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1469, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.6328, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 72%|#######2 | 80/111 [00:55<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9530, LAS: 0.9125, UEM: 0.6196, LEM: 
0.3912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6422, partial_loss/deprel_loss: 0.5340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7260, loss: 0.6324, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 76%|#######5 | 84/111 [00:57<00:17, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9531, LAS: 0.9127, UEM: 0.6151, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3872, partial_loss/deprel_loss: 0.4186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.6309, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 79%|#######9 | 88/111 [00:59<00:14, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9534, LAS: 0.9129, UEM: 0.6182, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.6296, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||: 83%|########2 | 92/111 [01:02<00:11, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9536, LAS: 0.9132, UEM: 0.6242, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4462, loss: 0.6277, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 86%|########6 | 96/111 [01:04<00:08, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9539, LAS: 0.9134, UEM: 0.6223, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5956, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7169, loss: 0.6272, batch_reg_loss: 
0.1702, reg_loss: 0.1704 ||: 91%|######### | 101/111 [01:06<00:05, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9542, LAS: 0.9139, UEM: 0.6224, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2040, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.6243, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 95%|#########5| 106/111 [01:09<00:02, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9536, LAS: 0.9133, UEM: 0.6157, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3588, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6290, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 99%|#########9| 110/111 [01:12<00:00, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9536, LAS: 0.9133, UEM: 0.6142, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4580, partial_loss/deprel_loss: 0.4665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6350, loss: 0.6291, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - 
ELAS | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.467 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.458 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - reg_loss | 0.170 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UEM | 0.614 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LAS | 0.913 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - loss | 0.629 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEM | 0.387 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UAS | 0.954 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EM | 0.915 | N/A\n", + "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:56:02,425 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:56:07,411 - INFO - combo.training.trainer - Epoch duration: 0:01:21.127162\n", + "2023-04-07 00:56:07,412 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:02\n", + "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Epoch 93/399\n", + "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:56:07,413 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:56:07,422 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9622, LAS: 0.9221, UEM: 0.7398, LEM: 0.5281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1570, partial_loss/deprel_loss: 0.2857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5584, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||: 4%|3 | 4/111 [00:02<01:17, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9572, LAS: 0.9153, UEM: 0.6616, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.6086, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||: 7%|7 | 8/111 [00:05<01:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9590, LAS: 0.9168, UEM: 0.6598, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.3891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6018, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||: 10%|9 | 11/111 
[00:07<01:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9566, LAS: 0.9156, UEM: 0.6450, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6822, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7548, loss: 0.6125, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||: 13%|#2 | 14/111 [00:09<01:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9550, LAS: 0.9141, UEM: 0.6348, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2216, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4626, loss: 0.6239, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||: 15%|#5 | 17/111 [00:11<01:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9546, LAS: 0.9142, UEM: 0.6136, LEM: 0.3776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.4792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6406, loss: 0.6247, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||: 19%|#8 | 21/111 [00:14<01:01, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9557, LAS: 0.9156, UEM: 0.6347, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4169, loss: 0.6161, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||: 23%|##2 | 25/111 [00:16<00:57, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9546, LAS: 0.9146, UEM: 0.6127, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3816, partial_loss/deprel_loss: 0.4059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 0.6273, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||: 26%|##6 | 29/111 [00:19<00:53, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9565, LAS: 0.9172, UEM: 0.6595, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1907, partial_loss/deprel_loss: 0.3468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.6083, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||: 29%|##8 | 32/111 [00:21<00:53, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9561, LAS: 0.9169, UEM: 0.6562, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.3134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 0.6078, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||: 32%|###2 | 36/111 [00:24<00:52, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9555, LAS: 0.9164, UEM: 0.6497, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7917, partial_loss/deprel_loss: 0.5317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7538, loss: 0.6085, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||: 35%|###5 | 39/111 [00:26<00:53, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9564, LAS: 0.9174, UEM: 0.6608, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4549, loss: 0.6001, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||: 38%|###7 | 42/111 [00:29<00:53, 1.30it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9564, LAS: 0.9173, UEM: 0.6523, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.6016, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 41%|#### | 45/111 [00:31<00:49, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9561, LAS: 0.9169, UEM: 0.6436, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5652, loss: 0.6044, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 44%|####4 | 49/111 [00:34<00:44, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9565, LAS: 0.9175, UEM: 0.6450, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6009, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 48%|####7 | 53/111 [00:36<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9563, LAS: 0.9174, UEM: 0.6370, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.6023, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 50%|##### | 56/111 [00:38<00:38, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9566, LAS: 0.9178, UEM: 0.6402, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5124, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.6001, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 53%|#####3 | 59/111 [00:40<00:36, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9570, LAS: 0.9181, UEM: 0.6485, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5983, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 56%|#####5 | 62/111 [00:43<00:34, 1.42it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9567, LAS: 0.9178, UEM: 0.6434, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.5990, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 59%|#####8 | 65/111 [00:45<00:32, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9572, LAS: 0.9183, UEM: 0.6455, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4426, loss: 0.5950, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||: 61%|######1 | 68/111 [00:47<00:31, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9570, LAS: 0.9181, UEM: 0.6403, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5097, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 0.5962, batch_reg_loss: 
0.1699, reg_loss: 0.1701 ||: 64%|######3 | 71/111 [00:49<00:29, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9570, LAS: 0.9181, UEM: 0.6342, LEM: 0.4048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6196, partial_loss/deprel_loss: 0.5692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5984, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||: 68%|######8 | 76/111 [00:52<00:23, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9560, LAS: 0.9172, UEM: 0.6291, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9994, partial_loss/deprel_loss: 0.7024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9317, loss: 0.6070, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||: 73%|#######2 | 81/111 [00:54<00:18, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9563, LAS: 0.9174, UEM: 0.6301, LEM: 0.3992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6907, partial_loss/deprel_loss: 0.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.6059, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||: 77%|#######7 | 86/111 [00:57<00:14, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9553, LAS: 0.9163, UEM: 0.6202, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.5488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7185, loss: 0.6131, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||: 82%|########1 | 91/111 [00:59<00:10, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9557, LAS: 0.9167, UEM: 
0.6267, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6865, loss: 0.6099, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||: 86%|########5 | 95/111 [01:02<00:09, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9554, LAS: 0.9163, UEM: 0.6206, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6465, partial_loss/deprel_loss: 0.5652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7514, loss: 0.6136, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||: 89%|########9 | 99/111 [01:05<00:07, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9553, LAS: 0.9162, UEM: 0.6243, LEM: 0.3965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1391, partial_loss/deprel_loss: 0.2918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6134, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||: 93%|#########2| 103/111 [01:07<00:05, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9549, LAS: 0.9158, UEM: 0.6186, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3359, partial_loss/deprel_loss: 0.4198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.6165, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 96%|#########6| 107/111 [01:10<00:02, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, 
batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.389 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.301 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - reg_loss | 0.170 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - UEM | 0.614 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LAS | 0.915 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - 
combo.training.tensorboard_writer - loss | 0.619 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEM | 0.388 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:57:23,899 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:57:29,960 - INFO - combo.training.trainer - Epoch duration: 0:01:22.548285\n", + "2023-04-07 00:57:29,961 - INFO - combo.training.trainer - Estimated training time remaining: 6:55:44\n", + "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Epoch 94/399\n", + "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:57:29,962 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:57:29,970 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9521, LAS: 0.9133, UEM: 0.4149, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5899, loss: 0.6595, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 3%|2 | 3/111 [00:02<01:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9525, LAS: 0.9124, UEM: 0.4244, LEM: 0.1976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.6374, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 6%|6 | 7/111 [00:04<01:06, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9542, LAS: 0.9137, UEM: 0.4699, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.6316, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 10%|9 | 11/111 [00:06<01:03, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9548, LAS: 0.9140, UEM: 0.4912, LEM: 0.2354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5478, loss: 0.6281, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 13%|#2 | 14/111 [00:08<01:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9528, LAS: 0.9122, UEM: 0.4714, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7772, partial_loss/deprel_loss: 0.5558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7698, loss: 0.6451, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 16%|#6 | 18/111 [00:11<01:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9527, LAS: 
0.9119, UEM: 0.4715, LEM: 0.2221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8692, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8445, loss: 0.6476, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 20%|#9 | 22/111 [00:13<00:57, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9716, UAS: 0.9558, LAS: 0.9159, UEM: 0.5880, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0331, partial_loss/deprel_loss: 0.1041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2597, loss: 0.6200, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 23%|##2 | 25/111 [00:16<00:59, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9549, LAS: 0.9152, UEM: 0.5827, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5290, partial_loss/deprel_loss: 0.4605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6231, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||: 25%|##5 | 28/111 [00:18<01:00, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9555, LAS: 0.9158, UEM: 0.5982, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.6142, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 28%|##7 | 31/111 [00:20<00:58, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9560, LAS: 0.9164, UEM: 0.6102, LEM: 0.3853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7661, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7543, loss: 0.6087, batch_reg_loss: 
0.1697, reg_loss: 0.1698 ||: 31%|### | 34/111 [00:23<00:56, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9562, LAS: 0.9169, UEM: 0.6093, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4293, loss: 0.6057, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 33%|###3 | 37/111 [00:25<00:54, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9176, UEM: 0.6248, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3037, partial_loss/deprel_loss: 0.3452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 0.6012, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 37%|###6 | 41/111 [00:28<00:49, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9555, LAS: 0.9159, UEM: 0.6103, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.5425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7178, loss: 0.6149, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 40%|###9 | 44/111 [00:30<00:46, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9549, LAS: 0.9153, UEM: 0.6039, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4688, loss: 0.6180, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 42%|####2 | 47/111 [00:32<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9551, LAS: 0.9155, UEM: 0.5987, LEM: 0.3679, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6414, partial_loss/deprel_loss: 0.5149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7099, loss: 0.6183, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 45%|####5 | 50/111 [00:34<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9556, LAS: 0.9162, UEM: 0.6107, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3878, loss: 0.6148, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 48%|####7 | 53/111 [00:36<00:41, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9538, LAS: 0.9145, UEM: 0.6052, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.6253, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||: 50%|##### | 56/111 [00:38<00:38, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9546, LAS: 0.9152, UEM: 0.6152, LEM: 0.3848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1899, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.6189, batch_reg_loss: 0.1697, reg_loss: 0.1697 ||: 55%|#####4 | 61/111 [00:40<00:31, 1.58it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9545, LAS: 0.9149, UEM: 0.6062, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3977, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5266, loss: 0.6216, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 59%|#####9 | 66/111 [00:43<00:26, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9538, LAS: 0.9138, UEM: 0.6011, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0929, partial_loss/deprel_loss: 0.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.6295, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 64%|######3 | 71/111 [00:45<00:22, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9542, LAS: 0.9143, UEM: 0.6086, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.6262, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 68%|######7 | 75/111 [00:48<00:20, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9537, LAS: 0.9138, UEM: 0.6020, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 71%|#######1 | 79/111 [00:50<00:18, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9539, LAS: 0.9140, UEM: 0.5997, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.6113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7987, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 75%|#######4 | 83/111 [00:53<00:16, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9354, UAS: 0.9544, LAS: 0.9147, UEM: 0.6118, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4641, loss: 0.6233, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 78%|#######8 | 87/111 [00:56<00:15, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9549, LAS: 0.9153, UEM: 0.6189, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5173, partial_loss/deprel_loss: 0.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6860, loss: 0.6188, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 82%|########1 | 91/111 [00:58<00:13, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9545, LAS: 0.9148, UEM: 0.6184, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6372, partial_loss/deprel_loss: 0.7892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1283, loss: 0.6222, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 86%|########5 | 95/111 [01:01<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9547, LAS: 0.9150, UEM: 0.6189, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2109, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4635, loss: 0.6209, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||: 88%|########8 | 98/111 [01:04<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9547, LAS: 0.9151, UEM: 0.6162, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4396, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.6197, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 92%|#########1| 102/111 [01:06<00:06, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9550, LAS: 0.9154, UEM: 0.6205, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6481, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 95%|#########5| 106/111 [01:09<00:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9547, LAS: 0.9151, UEM: 0.6143, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3580, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5671, loss: 0.6200, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 99%|#########9| 110/111 [01:11<00:00, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9550, LAS: 0.9155, UEM: 0.6235, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0758, partial_loss/deprel_loss: 0.1748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3245, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 
0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.175 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.076 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - reg_loss | 0.170 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UEM | 0.624 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LAS | 0.915 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - loss | 0.617 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEM | 0.391 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - EM | 0.957 | N/A\n", + "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 00:58:45,479 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 00:58:50,382 - INFO - combo.training.trainer - Epoch duration: 0:01:20.421411\n", + "2023-04-07 00:58:50,383 - INFO - combo.training.trainer - Estimated training time remaining: 6:54:19\n", + "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Epoch 95/399\n", + "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 00:58:50,384 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 00:58:50,393 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9403, LAS: 0.8966, UEM: 0.2033, LEM: 0.0664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7028, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8098, loss: 0.7676, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 3%|2 | 3/111 [00:02<01:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9443, LAS: 0.9015, UEM: 0.2599, LEM: 0.0791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7219, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 5%|5 | 6/111 [00:04<01:13, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9452, LAS: 0.9049, UEM: 0.4647, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4022, loss: 0.6918, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 8%|8 | 9/111 
[00:06<01:11, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9517, LAS: 0.9121, UEM: 0.5362, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.6405, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 12%|#1 | 13/111 [00:08<01:05, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9501, LAS: 0.9100, UEM: 0.5007, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4803, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.6529, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 14%|#4 | 16/111 [00:10<01:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9510, LAS: 0.9112, UEM: 0.5359, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.6384, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||: 17%|#7 | 19/111 [00:13<01:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9515, LAS: 0.9117, UEM: 0.5425, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.6385, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||: 21%|## | 23/111 [00:15<00:59, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9527, LAS: 0.9131, UEM: 0.5493, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4411, partial_loss/deprel_loss: 0.4339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.6308, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||: 23%|##3 | 26/111 [00:17<00:58, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9513, LAS: 0.9119, UEM: 0.5297, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6417, partial_loss/deprel_loss: 0.5229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.6360, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||: 26%|##6 | 29/111 [00:19<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9521, LAS: 0.9128, UEM: 0.5411, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6245, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.6294, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||: 29%|##8 | 32/111 [00:22<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9525, LAS: 0.9133, UEM: 0.5363, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4648, partial_loss/deprel_loss: 0.4901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6544, loss: 0.6274, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||: 32%|###1 | 35/111 [00:24<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9525, LAS: 0.9130, UEM: 0.5261, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7316, loss: 0.6312, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 35%|###5 | 39/111 [00:26<00:49, 1.44it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9537, LAS: 0.9144, UEM: 0.5419, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.6227, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 39%|###8 | 43/111 [00:28<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9520, LAS: 0.9128, UEM: 0.5411, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.3025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.6364, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 42%|####2 | 47/111 [00:30<00:38, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9530, LAS: 0.9136, UEM: 0.5572, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4463, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.6296, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||: 46%|####5 | 51/111 [00:33<00:34, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9539, LAS: 0.9149, UEM: 0.5827, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6151, partial_loss/deprel_loss: 0.5066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.6191, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 50%|##### | 56/111 [00:35<00:30, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9541, LAS: 0.9150, UEM: 0.5864, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.6187, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 54%|#####4 | 60/111 [00:38<00:29, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9704, UAS: 0.9552, LAS: 0.9164, UEM: 0.6180, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0377, partial_loss/deprel_loss: 0.1045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2604, loss: 0.6088, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 58%|#####7 | 64/111 [00:41<00:32, 1.45it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9551, LAS: 0.9162, UEM: 0.6103, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.6092, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 61%|######1 | 68/111 [00:44<00:28, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9553, LAS: 0.9164, UEM: 0.6085, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2413, partial_loss/deprel_loss: 0.3382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6091, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 65%|######4 | 72/111 [00:46<00:24, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9551, LAS: 0.9161, UEM: 0.6072, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.6118, batch_reg_loss: 
0.1693, reg_loss: 0.1694 ||: 68%|######8 | 76/111 [00:49<00:22, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9546, LAS: 0.9153, UEM: 0.6000, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6490, partial_loss/deprel_loss: 0.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8118, loss: 0.6166, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||: 72%|#######2 | 80/111 [00:51<00:20, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9547, LAS: 0.9156, UEM: 0.5963, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2473, partial_loss/deprel_loss: 0.3526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.6157, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||: 76%|#######5 | 84/111 [00:54<00:18, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9548, LAS: 0.9158, UEM: 0.5937, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2914, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.6155, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||: 79%|#######9 | 88/111 [00:58<00:16, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9547, LAS: 0.9157, UEM: 0.5955, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2497, partial_loss/deprel_loss: 0.3107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4677, loss: 0.6151, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||: 82%|########1 | 91/111 [01:00<00:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9548, LAS: 0.9158, UEM: 
0.5948, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6732, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8022, loss: 0.6142, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||: 86%|########5 | 95/111 [01:02<00:10, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9550, LAS: 0.9159, UEM: 0.5965, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1758, partial_loss/deprel_loss: 0.2661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.6134, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||: 89%|########9 | 99/111 [01:05<00:07, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9549, LAS: 0.9159, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2254, partial_loss/deprel_loss: 0.3636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.6133, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 93%|#########2| 103/111 [01:07<00:05, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9552, LAS: 0.9162, UEM: 0.6069, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2262, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6110, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 96%|#########6| 107/111 [01:09<00:02, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, 
batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:00:06,571 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9433, LAS: 0.8922, UEM: 0.5839, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3625, partial_loss/deprel_loss: 45.9887, partial_loss/cycle_loss: 0.0000, batch_loss: 37.0634, loss: 28.0423, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:03<00:10, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9475, LAS: 0.8973, UEM: 0.5948, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5580, partial_loss/deprel_loss: 23.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9084, loss: 23.4430, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9461, LAS: 0.8943, UEM: 0.5695, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1060, partial_loss/deprel_loss: 41.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 33.3602, loss: 24.6334, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.02it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9013, UEM: 0.6730, LEM: 0.4032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 22.7933, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2673, loss: 23.1488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 1.04it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9464, LAS: 0.8957, UEM: 0.6553, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6588, partial_loss/deprel_loss: 54.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 43.8111, loss: 24.7382, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.02it/s]\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.155 | 54.349\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - 
partial_loss/head_loss | 0.081 | 1.659\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - reg_loss | 0.169 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UEM | 0.622 | 0.655\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LAS | 0.917 | 0.896\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - loss | 0.606 | 24.738\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEM | 0.393 | 0.392\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | 0.946\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EM | 0.955 | 0.830\n", + "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:00:19,341 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:00:24,554 - INFO - combo.training.trainer - Epoch duration: 0:01:34.171200\n", + "2023-04-07 01:00:24,555 - INFO - combo.training.trainer - Estimated training time remaining: 6:53:37\n", + "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Epoch 96/399\n", + "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:00:24,562 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9391, LAS: 0.8974, UEM: 0.2827, LEM: 0.1307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7643, partial_loss/deprel_loss: 0.5785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7848, loss: 0.7524, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||: 4%|3 | 4/111 [00:02<01:00, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9463, LAS: 0.9054, UEM: 0.4872, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7313, partial_loss/deprel_loss: 0.5896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.6933, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 8%|8 | 9/111 [00:04<00:56, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9499, LAS: 0.9104, UEM: 0.5896, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.6497, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 11%|# | 12/111 
[00:07<01:00, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9503, LAS: 0.9112, UEM: 0.5665, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.5445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7201, loss: 0.6425, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 14%|#4 | 16/111 [00:09<00:55, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9521, LAS: 0.9129, UEM: 0.5732, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.4542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.6335, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 17%|#7 | 19/111 [00:11<00:56, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9524, LAS: 0.9133, UEM: 0.5812, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 0.5797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 0.6279, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 21%|## | 23/111 [00:13<00:54, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9520, LAS: 0.9131, UEM: 0.5641, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.3722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6309, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 24%|##4 | 27/111 [00:15<00:50, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9548, LAS: 0.9162, UEM: 0.6015, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6343, loss: 0.6099, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 29%|##8 | 32/111 [00:18<00:43, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9558, LAS: 0.9175, UEM: 0.6238, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.6023, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||: 33%|###3 | 37/111 [00:20<00:40, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9561, LAS: 0.9177, UEM: 0.6109, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2981, partial_loss/deprel_loss: 0.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5634, loss: 0.6028, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 37%|###6 | 41/111 [00:23<00:39, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9546, LAS: 0.9165, UEM: 0.6138, LEM: 0.3904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2492, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.6106, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 41%|#### | 45/111 [00:26<00:42, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9550, LAS: 0.9170, UEM: 0.6111, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6034, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6605, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 44%|####4 | 49/111 [00:29<00:39, 1.58it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9554, LAS: 0.9174, UEM: 0.6144, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.4575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6211, loss: 0.6032, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 48%|####7 | 53/111 [00:31<00:37, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9550, LAS: 0.9167, UEM: 0.6106, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6086, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.6088, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 51%|#####1 | 57/111 [00:34<00:35, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9552, LAS: 0.9167, UEM: 0.6143, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.5003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.6087, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 55%|#####4 | 61/111 [00:37<00:33, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9551, LAS: 0.9167, UEM: 0.6094, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4728, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6072, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 59%|#####8 | 65/111 [00:39<00:29, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9551, LAS: 0.9168, UEM: 0.6119, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1561, partial_loss/deprel_loss: 0.2667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||: 62%|######2 | 69/111 [00:42<00:26, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9551, LAS: 0.9169, UEM: 0.6096, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5493, loss: 0.6053, batch_reg_loss: 0.1689, reg_loss: 0.1691 ||: 66%|######5 | 73/111 [00:44<00:24, 1.54it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9560, LAS: 0.9179, UEM: 0.6290, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2955, partial_loss/deprel_loss: 0.3446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.5985, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 69%|######9 | 77/111 [00:47<00:23, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9564, LAS: 0.9185, UEM: 0.6391, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.4909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6723, loss: 0.5941, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 72%|#######2 | 80/111 [00:50<00:21, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9565, LAS: 0.9185, UEM: 0.6354, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5767, loss: 0.5948, batch_reg_loss: 
0.1689, reg_loss: 0.1690 ||: 76%|#######5 | 84/111 [00:52<00:17, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9563, LAS: 0.9183, UEM: 0.6299, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2253, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.5979, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 79%|#######9 | 88/111 [00:55<00:15, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9556, LAS: 0.9175, UEM: 0.6254, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.4963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.6032, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 83%|########2 | 92/111 [00:58<00:13, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9555, LAS: 0.9173, UEM: 0.6257, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5814, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7091, loss: 0.6043, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 86%|########6 | 96/111 [01:00<00:09, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9556, LAS: 0.9175, UEM: 0.6248, LEM: 0.4004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4346, loss: 0.6037, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||: 90%|######### | 100/111 [01:03<00:07, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9557, LAS: 0.9176, 
UEM: 0.6292, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9167, partial_loss/deprel_loss: 0.6152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8444, loss: 0.6018, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||: 94%|#########3| 104/111 [01:06<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9550, LAS: 0.9170, UEM: 0.6240, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4594, loss: 0.6050, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||: 97%|#########7| 108/111 [01:08<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9550, LAS: 0.9168, UEM: 0.6213, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6063, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||: 100%|##########| 111/111 [01:10<00:00, 1.57it/s]\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 
N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.426 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.243 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - reg_loss | 0.169 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UEM | 0.621 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - LAS | 0.917 | N/A\n", + "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - loss | 0.606 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEM | 0.397 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - UAS | 0.955 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EM | 0.920 | N/A\n", + "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:01:38,123 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:01:41,735 - INFO - combo.training.trainer - Epoch duration: 0:01:17.180312\n", + "2023-04-07 01:01:41,736 - INFO - combo.training.trainer - Estimated training time remaining: 6:52:02\n", + "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Epoch 97/399\n", + "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:01:41,737 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:01:41,751 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9528, LAS: 0.9152, UEM: 0.4238, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.6364, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||: 4%|3 | 4/111 [00:02<01:05, 1.63it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9571, LAS: 0.9196, UEM: 0.4810, LEM: 0.2370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3336, partial_loss/deprel_loss: 0.3597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5891, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||: 7%|7 | 8/111 [00:04<01:00, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9574, LAS: 0.9207, UEM: 0.5548, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2063, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4427, loss: 0.5791, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||: 12%|#1 | 13/111 
[00:06<00:54, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9551, LAS: 0.9179, UEM: 0.5253, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4222, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.6009, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||: 16%|#6 | 18/111 [00:09<00:48, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9556, LAS: 0.9183, UEM: 0.5201, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5889, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5964, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||: 21%|## | 23/111 [00:11<00:44, 1.99it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9550, LAS: 0.9174, UEM: 0.5125, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7134, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 24%|##4 | 27/111 [00:14<00:45, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9525, LAS: 0.9149, UEM: 0.5015, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7814, loss: 0.6175, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 28%|##7 | 31/111 [00:16<00:46, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9539, LAS: 0.9157, UEM: 0.5416, LEM: 0.3111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.6092, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 32%|###1 | 35/111 [00:19<00:47, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9550, LAS: 0.9171, UEM: 0.5771, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1882, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5997, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 35%|###5 | 39/111 [00:22<00:47, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9541, LAS: 0.9158, UEM: 0.5798, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0605, partial_loss/deprel_loss: 0.7466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9781, loss: 0.6078, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 39%|###8 | 43/111 [00:25<00:47, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9541, LAS: 0.9158, UEM: 0.5736, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5492, partial_loss/deprel_loss: 0.4876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.6089, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 42%|####2 | 47/111 [00:28<00:43, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9544, LAS: 0.9162, UEM: 0.5777, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.6079, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||: 45%|####5 | 50/111 [00:30<00:42, 1.43it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9539, LAS: 0.9156, UEM: 0.5682, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.4453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.6127, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||: 49%|####8 | 54/111 [00:32<00:38, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9547, LAS: 0.9161, UEM: 0.5806, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6084, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||: 52%|#####2 | 58/111 [00:35<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9558, LAS: 0.9174, UEM: 0.6119, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||: 56%|#####5 | 62/111 [00:39<00:36, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9561, LAS: 0.9176, UEM: 0.6116, LEM: 0.3917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4259, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.5979, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 59%|#####8 | 65/111 [00:41<00:34, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9558, LAS: 0.9175, UEM: 0.6148, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.5995, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 61%|######1 | 68/111 [00:43<00:32, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9559, LAS: 0.9177, UEM: 0.6136, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1631, partial_loss/deprel_loss: 0.2949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5977, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 64%|######3 | 71/111 [00:45<00:30, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9551, LAS: 0.9166, UEM: 0.6049, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6042, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 67%|######6 | 74/111 [00:47<00:26, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9549, LAS: 0.9165, UEM: 0.6025, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6400, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.6049, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 70%|####### | 78/111 [00:50<00:23, 1.40it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9559, LAS: 0.9177, UEM: 0.6219, LEM: 0.4045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1427, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3704, loss: 0.5963, batch_reg_loss: 
0.1686, reg_loss: 0.1687 ||: 74%|#######3 | 82/111 [00:53<00:19, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9562, LAS: 0.9179, UEM: 0.6242, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6873, loss: 0.5945, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 77%|#######6 | 85/111 [00:55<00:17, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9559, LAS: 0.9177, UEM: 0.6176, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4235, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5915, loss: 0.5972, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 80%|######## | 89/111 [00:57<00:14, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9562, LAS: 0.9180, UEM: 0.6208, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.5943, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||: 84%|########3 | 93/111 [01:00<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9562, LAS: 0.9179, UEM: 0.6276, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8061, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.5943, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 87%|########7 | 97/111 [01:03<00:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9561, LAS: 0.9178, 
UEM: 0.6256, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.5947, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 91%|######### | 101/111 [01:06<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9560, LAS: 0.9177, UEM: 0.6224, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.3745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5384, loss: 0.5959, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 94%|#########3| 104/111 [01:08<00:04, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9560, LAS: 0.9176, UEM: 0.6200, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.5966, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 96%|#########6| 107/111 [01:10<00:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9562, LAS: 0.9178, UEM: 0.6249, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.5948, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 99%|#########9| 110/111 [01:12<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9563, LAS: 0.9179, UEM: 0.6249, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2849, partial_loss/deprel_loss: 0.3783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 
0.5942, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:02:57,808 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.378 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.285 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - reg_loss | 0.169 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UEM | 0.625 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - LAS | 0.918 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - loss | 0.594 | N/A\n", + "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEM | 0.404 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 
| N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - UAS | 0.956 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EM | 0.929 | N/A\n", + "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:02:57,814 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:03:02,067 - INFO - combo.training.trainer - Epoch duration: 0:01:20.331514\n", + "2023-04-07 01:03:02,068 - INFO - combo.training.trainer - Estimated training time remaining: 6:50:36\n", + "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Epoch 98/399\n", + "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:03:02,069 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:03:02,078 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9541, LAS: 0.9186, UEM: 0.5242, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5159, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6171, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||: 5%|4 | 5/111 [00:02<00:44, 2.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9624, LAS: 0.9276, UEM: 0.7138, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0722, partial_loss/deprel_loss: 0.1715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3201, 
loss: 0.5430, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||: 8%|8 | 9/111 [00:04<00:45, 2.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9602, LAS: 0.9251, UEM: 0.6759, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4794, loss: 0.5607, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||: 12%|#1 | 13/111 [00:06<00:47, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9616, LAS: 0.9257, UEM: 0.6847, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1678, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4282, loss: 0.5542, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||: 14%|#4 | 16/111 [00:08<00:56, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9788, UAS: 0.9625, LAS: 0.9276, UEM: 0.7210, LEM: 0.5319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0258, partial_loss/deprel_loss: 0.0861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2424, loss: 0.5429, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||: 17%|#7 | 19/111 [00:11<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9600, LAS: 0.9245, UEM: 0.6866, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.5636, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||: 21%|## | 23/111 [00:14<00:59, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9593, LAS: 0.9240, UEM: 
0.6749, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.5654, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||: 23%|##3 | 26/111 [00:16<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9578, LAS: 0.9217, UEM: 0.6691, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5636, partial_loss/deprel_loss: 0.5041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.5787, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||: 27%|##7 | 30/111 [00:18<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9563, LAS: 0.9197, UEM: 0.6634, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8457, loss: 0.5912, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||: 31%|### | 34/111 [00:21<00:50, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9540, LAS: 0.9172, UEM: 0.6384, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7668, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.6081, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||: 34%|###4 | 38/111 [00:23<00:47, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9545, LAS: 0.9177, UEM: 0.6341, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6419, partial_loss/deprel_loss: 0.4970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6943, loss: 0.6035, batch_reg_loss: 0.1684, 
reg_loss: 0.1684 ||: 38%|###7 | 42/111 [00:26<00:44, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9552, LAS: 0.9182, UEM: 0.6314, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5426, partial_loss/deprel_loss: 0.5139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6880, loss: 0.5989, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||: 41%|####1 | 46/111 [00:29<00:42, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9548, LAS: 0.9177, UEM: 0.6174, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2994, partial_loss/deprel_loss: 0.4110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.6036, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||: 45%|####5 | 50/111 [00:31<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9551, LAS: 0.9179, UEM: 0.6165, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.3967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.6012, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 48%|####7 | 53/111 [00:33<00:38, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9557, LAS: 0.9184, UEM: 0.6215, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2372, partial_loss/deprel_loss: 0.3011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5959, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 50%|##### | 56/111 [00:35<00:36, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9561, LAS: 0.9188, UEM: 0.6278, LEM: 0.4150, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.5927, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 53%|#####3 | 59/111 [00:38<00:36, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9563, LAS: 0.9188, UEM: 0.6229, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3157, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5441, loss: 0.5923, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 56%|#####5 | 62/111 [00:40<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9559, LAS: 0.9182, UEM: 0.6228, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.5966, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 59%|#####8 | 65/111 [00:42<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9560, LAS: 0.9184, UEM: 0.6212, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1784, partial_loss/deprel_loss: 0.2485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4028, loss: 0.5939, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 62%|######2 | 69/111 [00:45<00:29, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9566, LAS: 0.9191, UEM: 0.6341, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1107, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5892, batch_reg_loss: 0.1683, reg_loss: 
0.1684 ||: 65%|######4 | 72/111 [00:47<00:28, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9566, LAS: 0.9189, UEM: 0.6289, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.5898, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 68%|######8 | 76/111 [00:50<00:24, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9195, UEM: 0.6385, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.3700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5858, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 71%|#######1 | 79/111 [00:52<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9571, LAS: 0.9194, UEM: 0.6355, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.5865, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||: 74%|#######3 | 82/111 [00:54<00:21, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9572, LAS: 0.9194, UEM: 0.6377, LEM: 0.4172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2213, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4880, loss: 0.5859, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||: 77%|#######6 | 85/111 [00:57<00:19, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8670, UAS: 0.9567, LAS: 0.9189, UEM: 0.6401, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1453, partial_loss/deprel_loss: 0.6996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9569, loss: 0.5903, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||: 79%|#######9 | 88/111 [00:59<00:17, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9568, LAS: 0.9189, UEM: 0.6360, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4078, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.5904, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||: 82%|########1 | 91/111 [01:01<00:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9564, LAS: 0.9184, UEM: 0.6309, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6180, partial_loss/deprel_loss: 0.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7107, loss: 0.5933, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||: 86%|########5 | 95/111 [01:03<00:11, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9568, LAS: 0.9188, UEM: 0.6325, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6260, partial_loss/deprel_loss: 0.5665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.5919, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 89%|########9 | 99/111 [01:06<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9567, LAS: 0.9188, UEM: 0.6271, LEM: 0.4056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4285, partial_loss/deprel_loss: 0.4146, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.5936, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 93%|#########2| 103/111 [01:08<00:05, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9573, LAS: 0.9193, UEM: 0.6311, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4122, loss: 0.5898, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 96%|#########6| 107/111 [01:10<00:02, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9572, LAS: 0.9193, UEM: 0.6285, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.5914, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.426 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.320 | N/A\n", + "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - reg_loss | 0.168 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UEM | 0.628 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LAS | 0.919 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - loss | 0.591 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEM | 0.404 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EM | 0.927 | N/A\n", + "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:04:18,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Epoch duration: 0:01:21.530588\n", + "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Estimated training time remaining: 6:49:15\n", + "2023-04-07 01:04:23,599 - INFO - allennlp.training.trainer - Epoch 99/399\n", + "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:04:23,610 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9617, LAS: 0.9249, UEM: 0.5893, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4106, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5332, batch_reg_loss: 0.1681, reg_loss: 0.1682 ||: 4%|3 | 4/111 [00:02<01:07, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9595, LAS: 0.9213, UEM: 0.6843, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.2754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4223, loss: 0.5445, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 6%|6 | 7/111 [00:05<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9636, LAS: 0.9278, UEM: 0.7559, LEM: 0.5669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4117, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.5165, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 9%|9 | 10/111 
[00:07<01:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9641, LAS: 0.9285, UEM: 0.7408, LEM: 0.5375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3300, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5475, loss: 0.5127, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 12%|#1 | 13/111 [00:09<01:13, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9580, LAS: 0.9216, UEM: 0.7034, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6043, partial_loss/deprel_loss: 0.5621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5675, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 15%|#5 | 17/111 [00:12<01:08, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9556, LAS: 0.9192, UEM: 0.6625, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7397, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7573, loss: 0.5879, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 19%|#8 | 21/111 [00:15<01:02, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9563, LAS: 0.9201, UEM: 0.6492, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2487, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.5868, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 23%|##2 | 25/111 [00:17<00:57, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9579, LAS: 0.9217, UEM: 0.6643, LEM: 0.4489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1325, partial_loss/deprel_loss: 0.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4171, loss: 0.5753, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 26%|##6 | 29/111 [00:19<00:53, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9570, LAS: 0.9207, UEM: 0.6437, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5556, loss: 0.5883, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||: 30%|##9 | 33/111 [00:22<00:51, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9567, LAS: 0.9202, UEM: 0.6330, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.5906, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 33%|###3 | 37/111 [00:25<00:48, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9578, LAS: 0.9212, UEM: 0.6431, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4669, loss: 0.5836, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 36%|###6 | 40/111 [00:27<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9584, LAS: 0.9217, UEM: 0.6527, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3646, loss: 0.5801, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 39%|###8 | 43/111 [00:29<00:46, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9586, LAS: 0.9219, UEM: 0.6642, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6093, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.5771, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 41%|####1 | 46/111 [00:32<00:47, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9580, LAS: 0.9211, UEM: 0.6541, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5288, loss: 0.5832, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 45%|####5 | 50/111 [00:34<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9584, LAS: 0.9217, UEM: 0.6583, LEM: 0.4435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5790, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 49%|####8 | 54/111 [00:37<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9592, LAS: 0.9225, UEM: 0.6651, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.5727, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 52%|#####2 | 58/111 [00:39<00:34, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9223, UEM: 0.6643, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1708, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5735, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 56%|#####5 | 62/111 [00:42<00:33, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9582, LAS: 0.9212, UEM: 0.6523, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7255, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.5811, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||: 59%|#####9 | 66/111 [00:44<00:29, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9577, LAS: 0.9206, UEM: 0.6417, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5670, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6838, loss: 0.5851, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 63%|######3 | 70/111 [00:47<00:26, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9571, LAS: 0.9201, UEM: 0.6357, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6575, loss: 0.5889, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 67%|######6 | 74/111 [00:50<00:25, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9568, LAS: 0.9196, UEM: 0.6329, LEM: 0.4119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5904, batch_reg_loss: 
0.1679, reg_loss: 0.1680 ||: 69%|######9 | 77/111 [00:53<00:25, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9567, LAS: 0.9194, UEM: 0.6282, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4504, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.5918, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 72%|#######2 | 80/111 [00:55<00:22, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9568, LAS: 0.9194, UEM: 0.6270, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.5915, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 75%|#######4 | 83/111 [00:57<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9567, LAS: 0.9193, UEM: 0.6383, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1086, partial_loss/deprel_loss: 0.2315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3748, loss: 0.5910, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 77%|#######7 | 86/111 [00:59<00:19, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9568, LAS: 0.9194, UEM: 0.6343, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.5909, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 81%|########1 | 90/111 [01:02<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9200, UEM: 
0.6318, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3063, partial_loss/deprel_loss: 0.3247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5869, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 86%|########5 | 95/111 [01:04<00:10, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9572, LAS: 0.9199, UEM: 0.6300, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.3539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.5871, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||: 90%|######### | 100/111 [01:06<00:06, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9572, LAS: 0.9199, UEM: 0.6342, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1752, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5868, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||: 95%|#########4| 105/111 [01:09<00:03, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9574, LAS: 0.9199, UEM: 0.6347, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4555, loss: 0.5861, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||: 98%|#########8| 109/111 [01:12<00:01, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9198, UEM: 0.6335, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5870, 
batch_reg_loss: 0.1678, reg_loss: 0.1680 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:05:40,141 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.347 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.218 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - reg_loss | 0.168 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UEM | 0.633 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LAS | 0.920 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - loss | 0.587 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEM | 0.406 | N/A\n", + "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EM | 0.935 | N/A\n", + "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:05:40,148 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Epoch duration: 0:01:21.518221\n", + "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:53\n", + "2023-04-07 01:05:45,118 - INFO - allennlp.training.trainer - Epoch 100/399\n", + "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:05:45,132 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9520, LAS: 0.9132, UEM: 0.6094, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6790, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7076, loss: 0.6213, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||: 4%|3 | 4/111 [00:02<01:06, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9586, LAS: 0.9210, UEM: 0.6494, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6368, 
loss: 0.5710, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||: 6%|6 | 7/111 [00:05<01:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9576, LAS: 0.9206, UEM: 0.5918, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6072, loss: 0.5797, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||: 10%|9 | 11/111 [00:07<01:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9606, LAS: 0.9235, UEM: 0.6388, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.3501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5600, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||: 13%|#2 | 14/111 [00:09<01:05, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9246, UEM: 0.6601, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.5466, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||: 15%|#5 | 17/111 [00:11<01:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9631, LAS: 0.9255, UEM: 0.6556, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.3960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5311, loss: 0.5455, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||: 19%|#8 | 21/111 [00:14<00:59, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9625, LAS: 0.9246, UEM: 
0.6400, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4028, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5531, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||: 23%|##2 | 25/111 [00:16<00:56, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9613, LAS: 0.9235, UEM: 0.6279, LEM: 0.3736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5770, loss: 0.5629, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||: 26%|##6 | 29/111 [00:19<00:52, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9605, LAS: 0.9226, UEM: 0.6154, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5035, loss: 0.5694, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||: 30%|##9 | 33/111 [00:21<00:50, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9584, LAS: 0.9204, UEM: 0.5967, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0388, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.5841, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||: 33%|###3 | 37/111 [00:24<00:47, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9586, LAS: 0.9211, UEM: 0.6047, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3691, partial_loss/deprel_loss: 0.3959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 0.5811, batch_reg_loss: 0.1677, 
reg_loss: 0.1677 ||: 37%|###6 | 41/111 [00:26<00:44, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9586, LAS: 0.9207, UEM: 0.6054, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4260, loss: 0.5829, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||: 41%|#### | 45/111 [00:29<00:41, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9592, LAS: 0.9213, UEM: 0.6040, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2283, partial_loss/deprel_loss: 0.3198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.5803, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||: 44%|####4 | 49/111 [00:31<00:38, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9581, LAS: 0.9202, UEM: 0.5987, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2588, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5069, loss: 0.5898, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||: 48%|####7 | 53/111 [00:34<00:36, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9587, LAS: 0.9208, UEM: 0.6148, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 51%|#####1 | 57/111 [00:36<00:33, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9587, LAS: 0.9209, UEM: 0.6090, LEM: 0.3644, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6407, loss: 0.5827, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 55%|#####4 | 61/111 [00:39<00:30, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9588, LAS: 0.9210, UEM: 0.6164, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.5814, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 59%|#####8 | 65/111 [00:42<00:30, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9596, LAS: 0.9221, UEM: 0.6403, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4319, loss: 0.5750, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 62%|######2 | 69/111 [00:45<00:31, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9595, LAS: 0.9220, UEM: 0.6402, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5404, partial_loss/deprel_loss: 0.5082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.5753, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 65%|######4 | 72/111 [00:47<00:28, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9578, LAS: 0.9204, UEM: 0.6296, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.5256, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.7055, loss: 0.5868, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 68%|######8 | 76/111 [00:50<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9583, LAS: 0.9208, UEM: 0.6404, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 72%|#######2 | 80/111 [00:52<00:20, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9581, LAS: 0.9206, UEM: 0.6366, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5347, loss: 0.5845, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||: 76%|#######5 | 84/111 [00:54<00:16, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9580, LAS: 0.9205, UEM: 0.6320, LEM: 0.4065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7726, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.5854, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||: 79%|#######9 | 88/111 [00:59<00:18, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9584, LAS: 0.9209, UEM: 0.6349, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4949, partial_loss/deprel_loss: 0.5901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5834, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||: 83%|########2 | 92/111 [01:01<00:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9354, UAS: 0.9585, LAS: 0.9210, UEM: 0.6396, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5819, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||: 86%|########6 | 96/111 [01:03<00:10, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9583, LAS: 0.9208, UEM: 0.6358, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.5829, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||: 91%|######### | 101/111 [01:06<00:06, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9589, LAS: 0.9215, UEM: 0.6489, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.2605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5776, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||: 95%|#########4| 105/111 [01:08<00:03, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9582, LAS: 0.9207, UEM: 0.6415, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4188, partial_loss/deprel_loss: 0.4373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6011, loss: 0.5831, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||: 98%|#########8| 109/111 [01:10<00:01, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9578, LAS: 0.9203, UEM: 0.6389, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3320, partial_loss/deprel_loss: 0.4104, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5622, loss: 0.5859, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||: 100%|##########| 111/111 [01:11<00:00, 1.55it/s]\n", + "2023-04-07 01:07:00,073 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9546, LAS: 0.9047, UEM: 0.6395, LEM: 0.3262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4405, partial_loss/deprel_loss: 24.0473, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3259, loss: 22.2299, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.10it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9455, LAS: 0.8921, UEM: 0.5202, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9855, partial_loss/deprel_loss: 35.7936, partial_loss/cycle_loss: 0.0000, batch_loss: 28.8320, loss: 23.8770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9455, LAS: 0.8928, UEM: 0.5466, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 46.5675, partial_loss/cycle_loss: 0.0000, batch_loss: 37.5207, loss: 25.1771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9443, LAS: 0.8922, UEM: 0.5920, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7122, partial_loss/deprel_loss: 54.8760, partial_loss/cycle_loss: 0.0000, batch_loss: 44.2433, loss: 25.7398, batch_reg_loss: 0.0000, reg_loss: 
0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9467, LAS: 0.8962, UEM: 0.6526, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 33.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 27.0014, loss: 24.9927, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.02it/s]\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.410 | 33.573\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.332 | 0.715\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - reg_loss | 0.168 | 0.000\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UEM | 0.639 | 0.653\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LAS | 0.920 | 0.896\n", + "2023-04-07 01:07:12,769 - INFO - 
combo.training.tensorboard_writer - loss | 0.586 | 24.993\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEM | 0.411 | 0.392\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | 0.947\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EM | 0.922 | 0.888\n", + "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:07:12,774 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Epoch duration: 0:01:32.751562\n", + "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:04\n", + "2023-04-07 01:07:17,870 - INFO - allennlp.training.trainer - Epoch 101/399\n", + "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:07:17,886 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9584, LAS: 0.9224, UEM: 0.5521, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4164, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.5597, loss: 0.5687, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||: 4%|3 | 4/111 [00:02<01:07, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9619, LAS: 0.9268, UEM: 0.5710, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5421, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||: 6%|6 | 7/111 [00:04<01:08, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9637, LAS: 0.9273, UEM: 0.6240, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.3880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.5432, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||: 10%|9 | 11/111 [00:07<01:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9639, LAS: 0.9273, UEM: 0.6749, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7485, partial_loss/deprel_loss: 0.5903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.5387, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||: 13%|#2 | 14/111 [00:09<01:08, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9642, LAS: 0.9277, UEM: 0.6725, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1768, partial_loss/deprel_loss: 0.3002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.5336, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||: 15%|#5 | 17/111 [00:11<01:05, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 
0.9644, LAS: 0.9284, UEM: 0.6859, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.3348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5291, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 18%|#8 | 20/111 [00:13<01:03, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9625, LAS: 0.9264, UEM: 0.6755, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8730, partial_loss/deprel_loss: 0.5417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7753, loss: 0.5407, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 22%|##1 | 24/111 [00:16<00:58, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9616, LAS: 0.9251, UEM: 0.6596, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4606, loss: 0.5484, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 25%|##5 | 28/111 [00:18<00:54, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9613, LAS: 0.9247, UEM: 0.6721, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1284, partial_loss/deprel_loss: 0.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3892, loss: 0.5513, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 28%|##7 | 31/111 [00:21<00:55, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9605, LAS: 0.9233, UEM: 0.6628, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3010, partial_loss/deprel_loss: 0.4006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5480, loss: 0.5633, 
batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 32%|###1 | 35/111 [00:23<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9603, LAS: 0.9233, UEM: 0.6703, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 0.5819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7936, loss: 0.5633, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 34%|###4 | 38/111 [00:26<00:51, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9592, LAS: 0.9221, UEM: 0.6568, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.5733, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||: 38%|###7 | 42/111 [00:28<00:46, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9601, LAS: 0.9232, UEM: 0.6750, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.5658, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 41%|#### | 45/111 [00:30<00:47, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9595, LAS: 0.9226, UEM: 0.6701, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1848, partial_loss/deprel_loss: 0.2736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5682, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 43%|####3 | 48/111 [00:33<00:46, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9591, LAS: 0.9219, UEM: 
0.6620, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.5704, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 47%|####6 | 52/111 [00:35<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9588, LAS: 0.9216, UEM: 0.6517, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2664, partial_loss/deprel_loss: 0.3243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4800, loss: 0.5722, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 51%|#####1 | 57/111 [00:38<00:34, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9581, LAS: 0.9209, UEM: 0.6493, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7026, partial_loss/deprel_loss: 0.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7663, loss: 0.5773, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 55%|#####4 | 61/111 [00:40<00:30, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9588, LAS: 0.9219, UEM: 0.6482, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.2670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5711, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 59%|#####9 | 66/111 [00:42<00:24, 1.83it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9582, LAS: 0.9211, UEM: 0.6423, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4466, partial_loss/deprel_loss: 0.4426, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6107, loss: 0.5769, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 63%|######3 | 70/111 [00:44<00:21, 1.88it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9577, LAS: 0.9206, UEM: 0.6412, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3618, partial_loss/deprel_loss: 0.7365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0288, loss: 0.5812, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 67%|######6 | 74/111 [00:47<00:21, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9579, LAS: 0.9208, UEM: 0.6425, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1749, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.5804, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 70%|####### | 78/111 [00:49<00:20, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9581, LAS: 0.9210, UEM: 0.6432, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2130, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5795, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||: 74%|#######3 | 82/111 [00:52<00:18, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9580, LAS: 0.9209, UEM: 0.6464, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.5795, batch_reg_loss: 0.1672, reg_loss: 0.1674 ||: 77%|#######7 | 86/111 [00:55<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, 
LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9579, LAS: 0.9210, UEM: 0.6548, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8256, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7588, loss: 0.5791, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 81%|########1 | 90/111 [00:58<00:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9581, LAS: 0.9212, UEM: 0.6497, LEM: 0.4266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5515, loss: 0.5793, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 85%|########4 | 94/111 [01:01<00:11, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9577, LAS: 0.9208, UEM: 0.6408, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4775, partial_loss/deprel_loss: 0.4866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6519, loss: 0.5825, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 88%|########8 | 98/111 [01:04<00:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9580, LAS: 0.9210, UEM: 0.6418, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.5806, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 92%|#########1| 102/111 [01:06<00:05, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9581, LAS: 0.9211, UEM: 0.6415, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, 
partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6017, loss: 0.5786, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 95%|#########5| 106/111 [01:09<00:03, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9576, LAS: 0.9205, UEM: 0.6366, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5686, loss: 0.5836, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 99%|#########9| 110/111 [01:12<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9574, LAS: 0.9204, UEM: 0.6345, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.5845, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:08:33,893 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + 
"2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.496 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.602 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - reg_loss | 0.167 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UEM | 0.635 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LAS | 0.920 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - loss | 0.584 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEM | 0.410 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - UAS | 0.957 | N/A\n", + "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - EM | 0.908 | N/A\n", + "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:08:33,900 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:08:38,949 - INFO - combo.training.trainer - Epoch duration: 0:01:21.078534\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:08:38,950 - INFO - combo.training.trainer - Estimated training time remaining: 6:45:41\n", + "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Epoch 102/399\n", + "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:08:38,951 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:08:38,961 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9606, LAS: 0.9211, UEM: 0.6524, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.5691, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||: 4%|3 | 4/111 [00:02<01:05, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9652, LAS: 0.9307, UEM: 0.7796, LEM: 0.6236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4351, loss: 0.5078, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||: 6%|6 | 7/111 [00:04<01:08, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9618, LAS: 0.9261, UEM: 0.7107, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.3575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5332, batch_reg_loss: 0.1671, reg_loss: 0.1672 ||: 10%|9 | 11/111 
[00:07<01:04, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9634, LAS: 0.9282, UEM: 0.7425, LEM: 0.5678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0768, partial_loss/deprel_loss: 0.1740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3217, loss: 0.5227, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 13%|#2 | 14/111 [00:09<01:07, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9632, LAS: 0.9276, UEM: 0.7412, LEM: 0.5525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7525, partial_loss/deprel_loss: 0.5876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7877, loss: 0.5288, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 15%|#5 | 17/111 [00:11<01:06, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9589, LAS: 0.9228, UEM: 0.7120, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5075, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1065, loss: 0.5675, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 18%|#8 | 20/111 [00:13<01:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9608, LAS: 0.9247, UEM: 0.7363, LEM: 0.5412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2577, partial_loss/deprel_loss: 0.3379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5495, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 21%|## | 23/111 [00:15<01:01, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9585, LAS: 0.9220, UEM: 0.7148, LEM: 0.5201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.8773, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8516, loss: 0.5670, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 24%|##4 | 27/111 [00:18<00:56, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9581, LAS: 0.9220, UEM: 0.7103, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5097, loss: 0.5672, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 28%|##7 | 31/111 [00:21<00:53, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9580, LAS: 0.9217, UEM: 0.7005, LEM: 0.4974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 31%|### | 34/111 [00:23<00:53, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9580, LAS: 0.9217, UEM: 0.6965, LEM: 0.4926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||: 33%|###3 | 37/111 [00:25<00:50, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9577, LAS: 0.9215, UEM: 0.6872, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1256, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3737, loss: 0.5715, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 38%|###7 | 42/111 [00:27<00:42, 1.61it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9560, LAS: 0.9194, UEM: 0.6657, LEM: 0.4646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6179, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.5871, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 42%|####2 | 47/111 [00:30<00:37, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9558, LAS: 0.9192, UEM: 0.6558, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5090, partial_loss/deprel_loss: 0.4367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.5894, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 47%|####6 | 52/111 [00:32<00:32, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9564, LAS: 0.9201, UEM: 0.6553, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1447, partial_loss/deprel_loss: 0.2119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.5824, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 50%|##### | 56/111 [00:35<00:32, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9571, LAS: 0.9206, UEM: 0.6498, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2884, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.5802, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 54%|#####4 | 60/111 [00:38<00:32, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9577, LAS: 0.9213, UEM: 0.6562, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0998, partial_loss/deprel_loss: 0.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3561, loss: 0.5750, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 58%|#####7 | 64/111 [00:41<00:31, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9585, LAS: 0.9220, UEM: 0.6612, LEM: 0.4481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1420, partial_loss/deprel_loss: 0.3105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4438, loss: 0.5705, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 61%|######1 | 68/111 [00:44<00:30, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9588, LAS: 0.9223, UEM: 0.6601, LEM: 0.4452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.4427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.5690, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 64%|######3 | 71/111 [00:46<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9588, LAS: 0.9222, UEM: 0.6597, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7346, loss: 0.5689, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||: 67%|######6 | 74/111 [00:48<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9592, LAS: 0.9224, UEM: 0.6585, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.5679, batch_reg_loss: 
0.1669, reg_loss: 0.1671 ||: 70%|####### | 78/111 [00:50<00:22, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9587, LAS: 0.9218, UEM: 0.6511, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7663, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7705, loss: 0.5723, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 74%|#######3 | 82/111 [00:53<00:19, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9592, LAS: 0.9222, UEM: 0.6537, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1484, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4355, loss: 0.5698, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 77%|#######7 | 86/111 [00:56<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9595, LAS: 0.9227, UEM: 0.6553, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4135, loss: 0.5666, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 80%|######## | 89/111 [00:58<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9593, LAS: 0.9226, UEM: 0.6498, LEM: 0.4279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5596, partial_loss/deprel_loss: 0.5026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6809, loss: 0.5676, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 84%|########3 | 93/111 [01:01<00:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9590, LAS: 0.9221, UEM: 
0.6420, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4337, partial_loss/deprel_loss: 0.4895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.5714, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 87%|########7 | 97/111 [01:04<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9589, LAS: 0.9219, UEM: 0.6386, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5602, loss: 0.5725, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 90%|######### | 100/111 [01:06<00:07, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9590, LAS: 0.9220, UEM: 0.6363, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.4484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6383, loss: 0.5716, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||: 93%|#########2| 103/111 [01:08<00:05, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9591, LAS: 0.9222, UEM: 0.6381, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 0.3158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4642, loss: 0.5704, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||: 95%|#########5| 106/111 [01:10<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9586, LAS: 0.9217, UEM: 0.6342, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4813, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.5739, 
batch_reg_loss: 0.1668, reg_loss: 0.1670 ||: 99%|#########9| 110/111 [01:13<00:00, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9585, LAS: 0.9215, UEM: 0.6323, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6699, partial_loss/deprel_loss: 0.5022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5751, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.502 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.670 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - reg_loss | 0.167 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UEM | 0.632 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - 
combo.training.tensorboard_writer - loss | 0.575 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEM | 0.410 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EM | 0.903 | N/A\n", + "2023-04-07 01:09:55,425 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:09:55,430 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Epoch duration: 0:01:20.620700\n", + "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Estimated training time remaining: 6:44:16\n", + "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Epoch 103/399\n", + "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:09:59,572 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:09:59,580 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9667, LAS: 0.9267, UEM: 0.6543, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4876, loss: 0.5462, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 4%|3 | 4/111 [00:02<01:16, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9632, LAS: 0.9251, UEM: 0.6317, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.3413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4771, loss: 0.5638, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 6%|6 | 7/111 [00:04<01:13, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9657, LAS: 0.9289, UEM: 0.7378, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0321, partial_loss/deprel_loss: 0.1224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2712, loss: 0.5427, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 9%|9 | 10/111 [00:07<01:15, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9589, LAS: 0.9227, UEM: 0.6830, LEM: 0.4771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7209, loss: 0.5806, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 13%|#2 | 14/111 [00:10<01:09, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9609, LAS: 0.9240, UEM: 0.6861, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2205, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5681, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 15%|#5 | 17/111 [00:12<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9623, LAS: 
0.9250, UEM: 0.7001, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6032, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6846, loss: 0.5604, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 18%|#8 | 20/111 [00:14<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9602, LAS: 0.9230, UEM: 0.6678, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5714, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 22%|##1 | 24/111 [00:16<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9611, LAS: 0.9240, UEM: 0.6702, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5612, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||: 26%|##6 | 29/111 [00:19<00:51, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9599, LAS: 0.9224, UEM: 0.6433, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5697, loss: 0.5704, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 31%|### | 34/111 [00:21<00:44, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9598, LAS: 0.9225, UEM: 0.6343, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5673, batch_reg_loss: 
0.1667, reg_loss: 0.1668 ||: 35%|###5 | 39/111 [00:23<00:39, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9603, LAS: 0.9230, UEM: 0.6486, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5966, partial_loss/deprel_loss: 0.5535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7288, loss: 0.5641, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 39%|###8 | 43/111 [00:26<00:38, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9583, LAS: 0.9213, UEM: 0.6354, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.5782, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 42%|####2 | 47/111 [00:29<00:39, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9562, LAS: 0.9189, UEM: 0.6229, LEM: 0.4013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9840, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5938, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 46%|####5 | 51/111 [00:31<00:37, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9570, LAS: 0.9198, UEM: 0.6357, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5857, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 50%|####9 | 55/111 [00:35<00:37, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9578, LAS: 0.9206, UEM: 0.6415, LEM: 
0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1857, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.5814, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||: 53%|#####3 | 59/111 [00:37<00:34, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9581, LAS: 0.9210, UEM: 0.6393, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4735, loss: 0.5791, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||: 57%|#####6 | 63/111 [00:40<00:33, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9585, LAS: 0.9215, UEM: 0.6440, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6223, loss: 0.5752, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||: 59%|#####9 | 66/111 [00:43<00:33, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9576, LAS: 0.9204, UEM: 0.6336, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8020, loss: 0.5839, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 62%|######2 | 69/111 [00:45<00:31, 1.34it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9574, LAS: 0.9203, UEM: 0.6283, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 
0.0000, batch_loss: 0.5206, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 65%|######4 | 72/111 [00:47<00:29, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9574, LAS: 0.9204, UEM: 0.6231, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3128, partial_loss/deprel_loss: 0.3818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 68%|######7 | 75/111 [00:50<00:27, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9578, LAS: 0.9211, UEM: 0.6336, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4455, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.5806, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 70%|####### | 78/111 [00:52<00:25, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9577, LAS: 0.9210, UEM: 0.6295, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6275, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7015, loss: 0.5811, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 74%|#######3 | 82/111 [00:55<00:22, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9580, LAS: 0.9213, UEM: 0.6309, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3798, partial_loss/deprel_loss: 0.3906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.5784, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 77%|#######7 | 86/111 [00:58<00:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9579, LAS: 0.9213, UEM: 0.6258, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.5247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7061, loss: 0.5788, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 81%|########1 | 90/111 [01:00<00:14, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9580, LAS: 0.9214, UEM: 0.6220, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3268, partial_loss/deprel_loss: 0.3844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5793, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 85%|########4 | 94/111 [01:02<00:11, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9583, LAS: 0.9216, UEM: 0.6287, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1964, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.5763, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||: 88%|########8 | 98/111 [01:05<00:08, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9591, LAS: 0.9225, UEM: 0.6436, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5697, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 92%|#########1| 102/111 [01:08<00:06, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9582, LAS: 0.9216, UEM: 0.6361, LEM: 0.4093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8615, partial_loss/deprel_loss: 0.5799, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 0.5751, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 95%|#########5| 106/111 [01:11<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9584, LAS: 0.9217, UEM: 0.6389, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5202, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.5732, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 99%|#########9| 110/111 [01:14<00:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9585, LAS: 0.9218, UEM: 0.6393, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2825, partial_loss/deprel_loss: 0.3588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 0.5726, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 100%|##########| 111/111 [01:14<00:00, 1.48it/s]\n", + "2023-04-07 01:11:17,321 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.359 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.282 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - reg_loss | 0.167 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UEM | 0.639 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - loss | 0.573 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEM | 0.412 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EM | 0.930 | N/A\n", + "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:11:17,334 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Epoch duration: 0:01:22.560293\n", + "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Estimated training time remaining: 6:42:57\n", + "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Epoch 104/399\n", + "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:11:22,133 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:11:22,143 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9579, LAS: 0.9237, UEM: 0.4843, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4918, partial_loss/deprel_loss: 0.4045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5448, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 3%|2 | 3/111 [00:02<01:12, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9596, LAS: 0.9227, UEM: 0.5784, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2692, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5189, loss: 0.5343, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 5%|5 | 6/111 [00:04<01:12, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9639, LAS: 0.9279, UEM: 0.6773, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4708, partial_loss/deprel_loss: 0.4108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5089, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 8%|8 | 9/111 
[00:06<01:10, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9582, LAS: 0.9228, UEM: 0.6431, LEM: 0.4054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.5546, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 13%|#2 | 14/111 [00:08<01:01, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9574, LAS: 0.9219, UEM: 0.6226, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2362, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4512, loss: 0.5644, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||: 17%|#7 | 19/111 [00:11<00:54, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9592, LAS: 0.9236, UEM: 0.6460, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.5537, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||: 22%|##1 | 24/111 [00:13<00:48, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9607, LAS: 0.9253, UEM: 0.6852, LEM: 0.4642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1332, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3697, loss: 0.5380, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||: 25%|##5 | 28/111 [00:16<00:50, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9590, LAS: 0.9238, UEM: 0.6721, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6512, loss: 0.5475, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||: 29%|##8 | 32/111 [00:19<00:50, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9587, LAS: 0.9229, UEM: 0.6562, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5505, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 0.5561, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||: 32%|###2 | 36/111 [00:21<00:47, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9583, LAS: 0.9225, UEM: 0.6445, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.5594, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||: 36%|###6 | 40/111 [00:24<00:45, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9579, LAS: 0.9221, UEM: 0.6292, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6220, loss: 0.5646, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||: 40%|###9 | 44/111 [00:27<00:44, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9591, LAS: 0.9233, UEM: 0.6478, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5555, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||: 43%|####3 | 48/111 [00:30<00:43, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9582, LAS: 0.9226, UEM: 0.6473, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6240, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7083, loss: 0.5615, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||: 46%|####5 | 51/111 [00:32<00:44, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9587, LAS: 0.9230, UEM: 0.6452, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2726, partial_loss/deprel_loss: 0.3050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.5592, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 49%|####8 | 54/111 [00:35<00:43, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9583, LAS: 0.9225, UEM: 0.6372, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6726, loss: 0.5631, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 51%|#####1 | 57/111 [00:37<00:40, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9576, LAS: 0.9218, UEM: 0.6313, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.5673, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 54%|#####4 | 60/111 [00:39<00:37, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9583, LAS: 0.9223, UEM: 0.6402, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 57%|#####6 | 63/111 [00:41<00:36, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9584, LAS: 0.9225, UEM: 0.6340, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2745, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4901, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 59%|#####9 | 66/111 [00:44<00:33, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9590, LAS: 0.9233, UEM: 0.6448, LEM: 0.4206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0997, partial_loss/deprel_loss: 0.2236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3651, loss: 0.5570, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 63%|######3 | 70/111 [00:46<00:28, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9587, LAS: 0.9229, UEM: 0.6394, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5598, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 67%|######6 | 74/111 [00:49<00:25, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9587, LAS: 0.9230, UEM: 0.6390, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8076, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.5591, batch_reg_loss: 
0.1663, reg_loss: 0.1664 ||: 70%|####### | 78/111 [00:51<00:20, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9590, LAS: 0.9232, UEM: 0.6394, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.5578, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||: 74%|#######3 | 82/111 [00:53<00:18, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9591, LAS: 0.9233, UEM: 0.6367, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4186, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.5577, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 77%|#######7 | 86/111 [00:56<00:15, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9588, LAS: 0.9227, UEM: 0.6289, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6325, partial_loss/deprel_loss: 0.5095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 81%|########1 | 90/111 [00:58<00:13, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9590, LAS: 0.9230, UEM: 0.6330, LEM: 0.4060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5602, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 85%|########4 | 94/111 [01:01<00:11, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9589, LAS: 0.9227, UEM: 
0.6276, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5134, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 88%|########8 | 98/111 [01:03<00:08, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9581, LAS: 0.9220, UEM: 0.6366, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0334, partial_loss/deprel_loss: 0.1020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5686, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 92%|#########1| 102/111 [01:06<00:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9582, LAS: 0.9220, UEM: 0.6356, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5684, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||: 95%|#########5| 106/111 [01:09<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9585, LAS: 0.9225, UEM: 0.6374, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3568, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.5656, batch_reg_loss: 0.1662, reg_loss: 0.1663 ||: 99%|#########9| 110/111 [01:12<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9585, LAS: 0.9225, UEM: 0.6356, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4134, partial_loss/deprel_loss: 0.4592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6162, loss: 0.5660, 
batch_reg_loss: 0.1662, reg_loss: 0.1663 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.459 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.413 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - reg_loss | 0.166 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UEM | 0.636 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - loss | 0.566 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEM | 0.415 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UAS | 0.958 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EM | 0.921 | N/A\n", + "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:12:38,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:12:43,544 - INFO - combo.training.trainer - Epoch duration: 0:01:21.411689\n", + "2023-04-07 01:12:43,545 - INFO - combo.training.trainer - Estimated training time remaining: 6:41:35\n", + "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Epoch 105/399\n", + "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:12:43,546 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:12:43,555 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9605, LAS: 0.9238, UEM: 0.5154, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5467, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||: 4%|3 | 4/111 [00:02<00:54, 1.95it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9555, LAS: 0.9193, UEM: 0.4861, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5006, 
loss: 0.5761, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||: 7%|7 | 8/111 [00:04<00:55, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9566, LAS: 0.9206, UEM: 0.5133, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6513, loss: 0.5721, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||: 11%|# | 12/111 [00:06<00:54, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9589, LAS: 0.9236, UEM: 0.5616, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2420, partial_loss/deprel_loss: 0.3775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.5580, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||: 14%|#4 | 16/111 [00:09<00:55, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9586, LAS: 0.9240, UEM: 0.5809, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7090, partial_loss/deprel_loss: 0.4814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6930, loss: 0.5559, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||: 18%|#8 | 20/111 [00:11<00:52, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9578, LAS: 0.9217, UEM: 0.5885, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4395, loss: 0.5726, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||: 22%|##1 | 24/111 [00:13<00:49, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9590, LAS: 0.9226, UEM: 
0.5978, LEM: 0.3627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 0.5674, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||: 26%|##6 | 29/111 [00:16<00:43, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9586, LAS: 0.9223, UEM: 0.5805, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6027, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7412, loss: 0.5714, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||: 30%|##9 | 33/111 [00:18<00:42, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9587, LAS: 0.9221, UEM: 0.6065, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2653, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5404, loss: 0.5698, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||: 33%|###3 | 37/111 [00:21<00:43, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9594, LAS: 0.9225, UEM: 0.6225, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2054, partial_loss/deprel_loss: 0.3136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.5648, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||: 37%|###6 | 41/111 [00:24<00:44, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9591, LAS: 0.9220, UEM: 0.6231, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.5681, batch_reg_loss: 0.1660, 
reg_loss: 0.1661 ||: 41%|#### | 45/111 [00:26<00:41, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9222, UEM: 0.6172, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5694, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 44%|####4 | 49/111 [00:29<00:39, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9592, LAS: 0.9220, UEM: 0.6134, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.5321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5711, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 48%|####7 | 53/111 [00:32<00:39, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9597, LAS: 0.9228, UEM: 0.6325, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2204, partial_loss/deprel_loss: 0.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4126, loss: 0.5662, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 50%|##### | 56/111 [00:34<00:39, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9752, UAS: 0.9606, LAS: 0.9240, UEM: 0.6598, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0256, partial_loss/deprel_loss: 0.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2456, loss: 0.5583, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 53%|#####3 | 59/111 [00:37<00:40, 1.28it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9606, LAS: 0.9239, UEM: 0.6677, LEM: 0.4476, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1025, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3735, loss: 0.5582, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 57%|#####6 | 63/111 [00:40<00:37, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9603, LAS: 0.9236, UEM: 0.6652, LEM: 0.4453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5848, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6681, loss: 0.5607, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 59%|#####9 | 66/111 [00:42<00:33, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9604, LAS: 0.9236, UEM: 0.6648, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1711, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5598, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 62%|######2 | 69/111 [00:44<00:31, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9592, LAS: 0.9223, UEM: 0.6538, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0157, partial_loss/deprel_loss: 0.6286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8720, loss: 0.5674, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||: 66%|######5 | 73/111 [00:47<00:26, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9588, LAS: 0.9219, UEM: 0.6449, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.4270, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5871, loss: 0.5712, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||: 69%|######9 | 77/111 [00:49<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9580, LAS: 0.9211, UEM: 0.6370, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9152, partial_loss/deprel_loss: 0.6189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8441, loss: 0.5799, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||: 72%|#######2 | 80/111 [00:51<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9576, LAS: 0.9209, UEM: 0.6312, LEM: 0.4145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5808, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||: 75%|#######4 | 83/111 [00:54<00:19, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9583, LAS: 0.9215, UEM: 0.6427, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1461, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4299, loss: 0.5761, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||: 77%|#######7 | 86/111 [00:56<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9589, LAS: 0.9221, UEM: 0.6461, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1714, partial_loss/deprel_loss: 0.3043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5725, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 81%|########1 | 90/111 [00:58<00:14, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9392, UAS: 0.9593, LAS: 0.9225, UEM: 0.6463, LEM: 0.4227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1769, partial_loss/deprel_loss: 0.2699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5698, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 85%|########4 | 94/111 [01:01<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9595, LAS: 0.9228, UEM: 0.6455, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2810, partial_loss/deprel_loss: 0.3794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5256, loss: 0.5681, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 88%|########8 | 98/111 [01:03<00:08, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9592, LAS: 0.9224, UEM: 0.6407, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5674, partial_loss/deprel_loss: 0.3946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5951, loss: 0.5697, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 92%|#########1| 102/111 [01:06<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9595, LAS: 0.9227, UEM: 0.6432, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.5678, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 95%|#########5| 106/111 [01:09<00:03, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9588, LAS: 0.9218, UEM: 0.6365, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3701, partial_loss/deprel_loss: 0.8036, 
partial_loss/cycle_loss: 0.0000, batch_loss: 1.0827, loss: 0.5747, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 99%|#########9| 110/111 [01:12<00:00, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9586, LAS: 0.9217, UEM: 0.6349, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6125, partial_loss/deprel_loss: 0.5305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.5760, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 01:13:59,528 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9553, LAS: 0.9111, UEM: 0.7989, LEM: 0.6196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1845, partial_loss/deprel_loss: 18.4393, partial_loss/cycle_loss: 0.0000, batch_loss: 14.7883, loss: 19.5219, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.05s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9480, LAS: 0.9002, UEM: 0.6879, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4402, partial_loss/deprel_loss: 23.9572, partial_loss/cycle_loss: 0.0000, batch_loss: 19.2538, loss: 24.4794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:07, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9532, LAS: 0.9045, UEM: 0.6803, LEM: 0.4123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7114, partial_loss/deprel_loss: 29.0657, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3948, loss: 22.1284, batch_reg_loss: 0.0000, reg_loss: 
0.0000 ||: 69%|######9 | 9/13 [00:07<00:03, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9449, LAS: 0.8945, UEM: 0.6256, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0921, partial_loss/deprel_loss: 41.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 33.5107, loss: 25.4303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:09<00:00, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9476, LAS: 0.8979, UEM: 0.6576, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1506, partial_loss/deprel_loss: 22.9104, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3585, loss: 24.8863, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00, 1.29it/s]\n", + "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.530 | 22.910\n", + "2023-04-07 
01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.613 | 0.151\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - reg_loss | 0.166 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UEM | 0.635 | 0.658\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LAS | 0.922 | 0.898\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - loss | 0.576 | 24.886\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEM | 0.409 | 0.394\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | 0.948\n", + "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - EM | 0.905 | 0.939\n", + "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:14:09,626 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:14:14,904 - INFO - combo.training.trainer - Epoch duration: 0:01:31.359274\n", + "2023-04-07 01:14:14,905 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:40\n", + "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Epoch 106/399\n", + "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:14:14,906 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:14:14,916 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9597, LAS: 0.9221, UEM: 0.6360, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5495, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 4%|3 | 4/111 [00:02<01:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9562, LAS: 0.9204, UEM: 0.6661, LEM: 0.4711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6598, partial_loss/deprel_loss: 0.4809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6825, loss: 0.5676, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 6%|6 | 7/111 [00:04<01:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9575, LAS: 0.9226, UEM: 0.6810, LEM: 0.4839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7804, partial_loss/deprel_loss: 0.6168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.5618, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 9%|9 | 10/111 
[00:07<01:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9585, LAS: 0.9235, UEM: 0.6787, LEM: 0.4796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 12%|#1 | 13/111 [00:09<01:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9589, LAS: 0.9241, UEM: 0.6982, LEM: 0.5117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7424, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 14%|#4 | 16/111 [00:11<01:08, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9575, LAS: 0.9222, UEM: 0.6738, LEM: 0.4852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6464, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.5711, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 17%|#7 | 19/111 [00:13<01:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9568, LAS: 0.9216, UEM: 0.6542, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2399, partial_loss/deprel_loss: 0.2948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4496, loss: 0.5771, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 21%|## | 23/111 [00:16<01:02, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9569, LAS: 0.9217, UEM: 0.6400, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2381, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.5755, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 24%|##4 | 27/111 [00:19<00:58, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9582, LAS: 0.9229, UEM: 0.6431, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.5670, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 28%|##7 | 31/111 [00:21<00:52, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9594, LAS: 0.9240, UEM: 0.6449, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3148, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.5601, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 32%|###1 | 35/111 [00:24<00:51, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9232, UEM: 0.6442, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8498, partial_loss/deprel_loss: 0.6169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5630, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||: 34%|###4 | 38/111 [00:26<00:49, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9595, LAS: 0.9239, UEM: 0.6561, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7706, partial_loss/deprel_loss: 0.5407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7524, loss: 0.5581, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 37%|###6 | 41/111 [00:28<00:48, 1.43it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9595, LAS: 0.9238, UEM: 0.6468, LEM: 0.4285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6490, loss: 0.5583, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 41%|#### | 45/111 [00:31<00:45, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9591, LAS: 0.9235, UEM: 0.6394, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7228, loss: 0.5618, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 43%|####3 | 48/111 [00:33<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9593, LAS: 0.9236, UEM: 0.6394, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4952, partial_loss/deprel_loss: 0.4717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5602, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 46%|####5 | 51/111 [00:35<00:42, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9601, LAS: 0.9243, UEM: 0.6537, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4148, loss: 0.5541, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 49%|####8 | 54/111 [00:38<00:43, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9597, LAS: 0.9237, UEM: 0.6536, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.5575, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 51%|#####1 | 57/111 [00:40<00:40, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9588, LAS: 0.9227, UEM: 0.6441, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6947, loss: 0.5655, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 54%|#####4 | 60/111 [00:42<00:38, 1.33it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9592, LAS: 0.9230, UEM: 0.6392, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3362, partial_loss/deprel_loss: 0.4284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5756, loss: 0.5650, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 58%|#####7 | 64/111 [00:44<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9229, UEM: 0.6352, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5645, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||: 61%|######1 | 68/111 [00:47<00:28, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9587, LAS: 0.9225, UEM: 0.6254, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5371, partial_loss/deprel_loss: 0.5104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.5688, batch_reg_loss: 
0.1657, reg_loss: 0.1658 ||: 65%|######4 | 72/111 [00:49<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9586, LAS: 0.9223, UEM: 0.6207, LEM: 0.3927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5256, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5691, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 68%|######8 | 76/111 [00:52<00:23, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9587, LAS: 0.9223, UEM: 0.6193, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1841, partial_loss/deprel_loss: 0.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4547, loss: 0.5685, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 72%|#######2 | 80/111 [00:55<00:22, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9590, LAS: 0.9226, UEM: 0.6208, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.5656, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 75%|#######4 | 83/111 [00:58<00:20, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9588, LAS: 0.9222, UEM: 0.6164, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5515, partial_loss/deprel_loss: 0.5246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.5683, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 77%|#######7 | 86/111 [01:00<00:17, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9583, LAS: 0.9218, UEM: 
0.6130, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.5711, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 80%|######## | 89/111 [01:02<00:15, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9588, LAS: 0.9224, UEM: 0.6181, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1722, partial_loss/deprel_loss: 0.2980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4384, loss: 0.5672, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 84%|########3 | 93/111 [01:04<00:12, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9594, LAS: 0.9231, UEM: 0.6311, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0772, partial_loss/deprel_loss: 0.2163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3541, loss: 0.5627, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 88%|########8 | 98/111 [01:07<00:08, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9593, LAS: 0.9232, UEM: 0.6285, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6855, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.5622, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||: 93%|#########2| 103/111 [01:09<00:04, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9589, LAS: 0.9229, UEM: 0.6367, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6451, loss: 0.5652, 
batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 96%|#########6| 107/111 [01:11<00:02, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.506 | 
N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.690 | N/A\n", + "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - reg_loss | 0.166 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UEM | 0.639 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LAS | 0.923 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - loss | 0.564 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEM | 0.415 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EM | 0.907 | N/A\n", + "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:15:32,914 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:15:37,937 - INFO - combo.training.trainer - Epoch duration: 0:01:23.032082\n", + "2023-04-07 01:15:37,938 - INFO - combo.training.trainer - Estimated training time remaining: 6:39:22\n", + "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Epoch 107/399\n", + "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:15:37,939 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:15:37,951 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9404, LAS: 0.9045, UEM: 0.1818, LEM: 0.0670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6183, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.7128, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9551, LAS: 0.9217, UEM: 0.7477, LEM: 0.6220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4707, loss: 0.5912, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 5%|5 | 6/111 [00:04<01:20, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9598, LAS: 0.9264, UEM: 0.7318, LEM: 0.5729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5564, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 8%|8 | 9/111 
[00:06<01:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9638, LAS: 0.9295, UEM: 0.7680, LEM: 0.5838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0983, partial_loss/deprel_loss: 0.1903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3374, loss: 0.5257, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 11%|# | 12/111 [00:09<01:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9645, LAS: 0.9301, UEM: 0.7532, LEM: 0.5563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5021, loss: 0.5165, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 14%|#4 | 16/111 [00:12<01:10, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9611, LAS: 0.9260, UEM: 0.7304, LEM: 0.5306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0098, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.5462, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 17%|#7 | 19/111 [00:14<01:07, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9604, LAS: 0.9254, UEM: 0.7239, LEM: 0.5191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9762, partial_loss/deprel_loss: 0.5604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8090, loss: 0.5532, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 20%|#9 | 22/111 [00:16<01:06, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9597, LAS: 0.9250, UEM: 0.7145, LEM: 0.5123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.6173, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6822, loss: 0.5542, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 23%|##2 | 25/111 [00:18<01:03, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9588, LAS: 0.9239, UEM: 0.6825, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4539, partial_loss/deprel_loss: 0.4544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5627, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||: 26%|##6 | 29/111 [00:21<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9579, LAS: 0.9230, UEM: 0.6704, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8390, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7380, loss: 0.5715, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 29%|##8 | 32/111 [00:23<00:55, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9584, LAS: 0.9234, UEM: 0.6645, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3485, partial_loss/deprel_loss: 0.3792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5385, loss: 0.5686, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 32%|###1 | 35/111 [00:25<00:53, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9585, LAS: 0.9232, UEM: 0.6623, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6749, loss: 0.5675, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 34%|###4 | 38/111 [00:27<00:50, 1.44it/s]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9595, LAS: 0.9242, UEM: 0.6705, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.5603, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 37%|###6 | 41/111 [00:29<00:49, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9595, LAS: 0.9238, UEM: 0.6617, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.5607, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 41%|#### | 45/111 [00:32<00:44, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9233, UEM: 0.6512, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4623, loss: 0.5633, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 44%|####4 | 49/111 [00:34<00:39, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6471, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3814, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.5621, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 48%|####7 | 53/111 [00:36<00:36, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9592, LAS: 0.9237, UEM: 0.6426, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 
0.2156, partial_loss/deprel_loss: 0.3679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.5612, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 51%|#####1 | 57/111 [00:39<00:34, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9596, LAS: 0.9240, UEM: 0.6447, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1229, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4231, loss: 0.5587, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||: 55%|#####4 | 61/111 [00:42<00:32, 1.53it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9597, LAS: 0.9239, UEM: 0.6410, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5022, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.5594, batch_reg_loss: 0.1654, reg_loss: 0.1654 ||: 59%|#####8 | 65/111 [00:44<00:29, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9589, LAS: 0.9234, UEM: 0.6424, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1442, partial_loss/deprel_loss: 0.2097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3620, loss: 0.5627, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 62%|######2 | 69/111 [00:47<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9592, LAS: 0.9236, UEM: 0.6441, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.5617, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 
66%|######5 | 73/111 [00:50<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9599, LAS: 0.9243, UEM: 0.6642, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0766, partial_loss/deprel_loss: 0.1825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3266, loss: 0.5553, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 70%|####### | 78/111 [00:52<00:20, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9604, LAS: 0.9248, UEM: 0.6636, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5532, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 75%|#######4 | 83/111 [00:54<00:15, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9605, LAS: 0.9249, UEM: 0.6583, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.5531, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 79%|#######9 | 88/111 [00:57<00:12, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9603, LAS: 0.9246, UEM: 0.6530, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5549, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 83%|########2 | 92/111 [00:59<00:10, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9597, LAS: 0.9239, UEM: 0.6455, LEM: 0.4215, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6310, partial_loss/deprel_loss: 0.5527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7336, loss: 0.5602, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||: 86%|########6 | 96/111 [01:02<00:08, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9233, UEM: 0.6407, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9582, partial_loss/deprel_loss: 0.5912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8299, loss: 0.5646, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||: 90%|######### | 100/111 [01:04<00:06, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9591, LAS: 0.9231, UEM: 0.6373, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5348, loss: 0.5664, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||: 94%|#########3| 104/111 [01:08<00:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9592, LAS: 0.9232, UEM: 0.6353, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.4573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.5661, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||: 97%|#########7| 108/111 [01:10<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9596, LAS: 0.9237, UEM: 0.6431, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.3154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5627, batch_reg_loss: 0.1652, 
reg_loss: 0.1654 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.315 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.255 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - reg_loss | 0.165 | N/A\n", + "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UEM | 0.643 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - loss | 0.563 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEM | 0.419 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 
01:16:54,109 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EM | 0.936 | N/A\n", + "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:16:54,114 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:16:59,229 - INFO - combo.training.trainer - Epoch duration: 0:01:21.291164\n", + "2023-04-07 01:16:59,230 - INFO - combo.training.trainer - Estimated training time remaining: 6:37:58\n", + "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Epoch 108/399\n", + "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:16:59,239 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9553, LAS: 0.9185, UEM: 0.4522, LEM: 0.2261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.6150, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 3%|2 | 3/111 [00:02<01:15, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9546, LAS: 0.9193, UEM: 0.4889, LEM: 0.2563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.6051, 
batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 5%|5 | 6/111 [00:04<01:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9595, LAS: 0.9240, UEM: 0.6025, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1919, partial_loss/deprel_loss: 0.2749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4235, loss: 0.5659, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 8%|8 | 9/111 [00:06<01:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9532, LAS: 0.9178, UEM: 0.5312, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0256, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8277, loss: 0.5976, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 12%|#1 | 13/111 [00:09<01:08, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9536, LAS: 0.9181, UEM: 0.5355, LEM: 0.3208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5954, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 14%|#4 | 16/111 [00:11<01:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9538, LAS: 0.9180, UEM: 0.5170, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4307, partial_loss/deprel_loss: 0.3894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5964, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 17%|#7 | 19/111 [00:13<01:04, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9534, LAS: 0.9171, UEM: 0.5024, LEM: 0.2893, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.4720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6483, loss: 0.5977, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 20%|#9 | 22/111 [00:15<01:01, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9547, LAS: 0.9183, UEM: 0.5345, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6225, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5869, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 23%|##2 | 25/111 [00:17<01:02, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9568, LAS: 0.9208, UEM: 0.5885, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3942, loss: 0.5704, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||: 25%|##5 | 28/111 [00:19<00:59, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9567, LAS: 0.9207, UEM: 0.5925, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6408, partial_loss/deprel_loss: 0.6466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.5757, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 28%|##7 | 31/111 [00:22<00:59, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9570, LAS: 0.9211, UEM: 0.5842, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5759, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 
31%|### | 34/111 [00:24<00:56, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9571, LAS: 0.9210, UEM: 0.5775, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5832, partial_loss/deprel_loss: 0.5241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.5768, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 33%|###3 | 37/111 [00:26<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9566, LAS: 0.9205, UEM: 0.5616, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5129, partial_loss/deprel_loss: 0.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.5796, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 37%|###6 | 41/111 [00:29<00:48, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9568, LAS: 0.9208, UEM: 0.5599, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7523, partial_loss/deprel_loss: 0.5404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7479, loss: 0.5798, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 41%|#### | 45/111 [00:31<00:44, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9573, LAS: 0.9212, UEM: 0.5717, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.3491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.5767, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 43%|####3 | 48/111 [00:33<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9577, LAS: 0.9217, UEM: 0.5806, LEM: 0.3533, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 0.5721, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 46%|####5 | 51/111 [00:35<00:42, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9585, LAS: 0.9226, UEM: 0.6101, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0995, partial_loss/deprel_loss: 0.1774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3269, loss: 0.5642, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 49%|####8 | 54/111 [00:38<00:40, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9580, LAS: 0.9222, UEM: 0.6093, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9579, partial_loss/deprel_loss: 0.6240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8558, loss: 0.5683, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||: 51%|#####1 | 57/111 [00:40<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9593, LAS: 0.9234, UEM: 0.6378, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4303, loss: 0.5589, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||: 55%|#####4 | 61/111 [00:42<00:33, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9597, LAS: 0.9237, UEM: 0.6403, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 
0.5568, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||: 59%|#####8 | 65/111 [00:44<00:28, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9601, LAS: 0.9239, UEM: 0.6396, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4998, loss: 0.5548, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 63%|######3 | 70/111 [00:46<00:22, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9602, LAS: 0.9242, UEM: 0.6355, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5529, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 68%|######7 | 75/111 [00:49<00:19, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9609, LAS: 0.9247, UEM: 0.6496, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4851, loss: 0.5488, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 71%|#######1 | 79/111 [00:51<00:18, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9605, LAS: 0.9245, UEM: 0.6596, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6113, partial_loss/deprel_loss: 0.5152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6994, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 75%|#######4 | 83/111 [00:55<00:18, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 
0.9602, LAS: 0.9244, UEM: 0.6551, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4968, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 78%|#######8 | 87/111 [00:58<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9606, LAS: 0.9248, UEM: 0.6565, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.3940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5639, loss: 0.5483, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||: 82%|########1 | 91/111 [01:00<00:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9600, LAS: 0.9242, UEM: 0.6535, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6841, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.5532, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 86%|########5 | 95/111 [01:03<00:10, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9598, LAS: 0.9239, UEM: 0.6465, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.5551, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 89%|########9 | 99/111 [01:05<00:07, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.5308, loss: 0.5557, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 93%|#########2| 103/111 [01:08<00:05, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9592, LAS: 0.9235, UEM: 0.6426, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7170, loss: 0.5577, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 96%|#########6| 107/111 [01:11<00:02, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 01:18:15,970 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - 
INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.441 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.469 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - reg_loss | 0.165 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UEM | 0.640 | N/A\n", + "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - loss | 0.558 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEM | 0.416 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EM | 0.922 | N/A\n", + "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:18:15,977 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Epoch duration: 0:01:21.274289\n", + "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Estimated training time remaining: 6:36:35\n", + "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Epoch 109/399\n", + "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:18:20,511 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9593, LAS: 0.9236, UEM: 0.6521, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6639, loss: 0.5311, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||: 3%|2 | 3/111 [00:02<01:20, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9639, LAS: 0.9292, UEM: 0.6776, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3725, loss: 0.5108, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||: 6%|6 | 7/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9647, LAS: 0.9301, UEM: 0.7206, LEM: 0.5242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5017, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.4998, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||: 9%|9 | 10/111 
[00:07<01:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9639, LAS: 0.9291, UEM: 0.6909, LEM: 0.4869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2603, partial_loss/deprel_loss: 0.3373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5078, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||: 12%|#1 | 13/111 [00:09<01:09, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9650, LAS: 0.9297, UEM: 0.7081, LEM: 0.4977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1774, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4507, loss: 0.5012, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||: 14%|#4 | 16/111 [00:11<01:09, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9652, LAS: 0.9295, UEM: 0.7043, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1694, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.5025, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||: 17%|#7 | 19/111 [00:13<01:06, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9654, LAS: 0.9295, UEM: 0.6904, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5185, loss: 0.5048, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||: 20%|#9 | 22/111 [00:15<01:04, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9639, LAS: 0.9277, UEM: 0.6742, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.6014, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6864, loss: 0.5192, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||: 23%|##3 | 26/111 [00:18<00:59, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9629, LAS: 0.9264, UEM: 0.6690, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9460, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8939, loss: 0.5308, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||: 26%|##6 | 29/111 [00:20<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9615, LAS: 0.9251, UEM: 0.6499, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5409, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||: 29%|##8 | 32/111 [00:22<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9618, LAS: 0.9255, UEM: 0.6579, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||: 32%|###1 | 35/111 [00:24<00:54, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9622, LAS: 0.9256, UEM: 0.6576, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5119, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||: 35%|###5 | 39/111 [00:27<00:49, 1.46it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9624, LAS: 0.9262, UEM: 0.6782, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6272, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.5356, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||: 38%|###7 | 42/111 [00:29<00:50, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9618, LAS: 0.9259, UEM: 0.6666, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6737, loss: 0.5404, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||: 42%|####2 | 47/111 [00:32<00:42, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9612, LAS: 0.9255, UEM: 0.6695, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5427, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 46%|####5 | 51/111 [00:35<00:40, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9617, LAS: 0.9261, UEM: 0.6680, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.5398, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 50%|####9 | 55/111 [00:37<00:35, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9620, LAS: 0.9264, UEM: 0.6709, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.2889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.5356, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 53%|#####3 | 59/111 [00:40<00:34, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9621, LAS: 0.9265, UEM: 0.6713, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5340, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 57%|#####6 | 63/111 [00:43<00:32, 1.47it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9622, LAS: 0.9267, UEM: 0.6706, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.2805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4222, loss: 0.5326, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 60%|###### | 67/111 [00:45<00:28, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9617, LAS: 0.9261, UEM: 0.6613, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2136, partial_loss/deprel_loss: 0.3104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.5385, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 65%|######4 | 72/111 [00:47<00:23, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9610, LAS: 0.9255, UEM: 0.6554, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.4840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6818, loss: 0.5429, batch_reg_loss: 
0.1647, reg_loss: 0.1648 ||: 68%|######8 | 76/111 [00:50<00:21, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9607, LAS: 0.9252, UEM: 0.6508, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5461, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 72%|#######2 | 80/111 [00:52<00:18, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9607, LAS: 0.9251, UEM: 0.6457, LEM: 0.4202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.5473, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||: 76%|#######5 | 84/111 [00:55<00:16, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9606, LAS: 0.9251, UEM: 0.6512, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8519, loss: 0.5472, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9607, LAS: 0.9251, UEM: 0.6511, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5113, loss: 0.5471, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||: 83%|########2 | 92/111 [01:00<00:12, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9605, LAS: 0.9250, UEM: 
0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0870, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3612, loss: 0.5474, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||: 86%|########6 | 96/111 [01:03<00:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9600, LAS: 0.9245, UEM: 0.6535, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.5521, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||: 90%|######### | 100/111 [01:06<00:07, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9596, LAS: 0.9239, UEM: 0.6484, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.4882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.5571, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||: 94%|#########3| 104/111 [01:08<00:04, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9596, LAS: 0.9239, UEM: 0.6458, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4867, loss: 0.5568, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||: 97%|#########7| 108/111 [01:11<00:01, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.5579, 
batch_reg_loss: 0.1646, reg_loss: 0.1647 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.372 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.227 | N/A\n", + "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - reg_loss | 0.165 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UEM | 0.643 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - loss | 0.558 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEM | 0.420 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 
N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EM | 0.929 | N/A\n", + "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:19:36,953 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Epoch duration: 0:01:21.083316\n", + "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Estimated training time remaining: 6:35:12\n", + "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Epoch 110/399\n", + "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:19:41,614 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9717, LAS: 0.9407, UEM: 0.8579, LEM: 0.7503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4825, partial_loss/deprel_loss: 0.4682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6356, loss: 0.4710, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||: 3%|2 | 3/111 [00:02<01:23, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9648, LAS: 0.9312, UEM: 0.7607, LEM: 0.6095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.3122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4630, 
loss: 0.5286, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||: 5%|5 | 6/111 [00:04<01:19, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9631, LAS: 0.9301, UEM: 0.7603, LEM: 0.6183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5614, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7401, loss: 0.5314, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||: 8%|8 | 9/111 [00:06<01:16, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9626, LAS: 0.9295, UEM: 0.7216, LEM: 0.5597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4509, loss: 0.5329, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||: 11%|# | 12/111 [00:08<01:14, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9602, LAS: 0.9259, UEM: 0.6921, LEM: 0.5212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.5588, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||: 14%|#3 | 15/111 [00:10<01:09, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9605, LAS: 0.9263, UEM: 0.6697, LEM: 0.4844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.5584, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||: 17%|#7 | 19/111 [00:13<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9598, LAS: 0.9255, UEM: 0.6550, 
LEM: 0.4644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1687, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5648, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||: 20%|#9 | 22/111 [00:15<01:03, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9586, LAS: 0.9242, UEM: 0.6355, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.4628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.5702, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||: 23%|##3 | 26/111 [00:18<00:58, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9580, LAS: 0.9236, UEM: 0.6279, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2239, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5715, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 27%|##7 | 30/111 [00:21<00:55, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9576, LAS: 0.9234, UEM: 0.6131, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.5330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7145, loss: 0.5735, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 30%|##9 | 33/111 [00:23<00:55, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9568, LAS: 0.9225, UEM: 0.6158, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2690, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5064, loss: 0.5788, batch_reg_loss: 0.1645, reg_loss: 
0.1645 ||: 32%|###2 | 36/111 [00:25<00:53, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9568, LAS: 0.9225, UEM: 0.6259, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0041, partial_loss/deprel_loss: 0.5339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.5774, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 35%|###5 | 39/111 [00:27<00:53, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9555, LAS: 0.9210, UEM: 0.6101, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8748, partial_loss/deprel_loss: 0.6011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8203, loss: 0.5890, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 39%|###8 | 43/111 [00:30<00:48, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9556, LAS: 0.9212, UEM: 0.5979, LEM: 0.3897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5680, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6151, loss: 0.5863, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 43%|####3 | 48/111 [00:32<00:39, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9562, LAS: 0.9215, UEM: 0.6145, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0934, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5821, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 48%|####7 | 53/111 [00:34<00:33, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9565, LAS: 0.9217, UEM: 0.6144, LEM: 0.3993, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.5790, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||: 51%|#####1 | 57/111 [00:36<00:30, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9562, LAS: 0.9214, UEM: 0.6066, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2144, partial_loss/deprel_loss: 0.3356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.5818, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 55%|#####4 | 61/111 [00:38<00:27, 1.84it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9565, LAS: 0.9219, UEM: 0.6104, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5782, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 59%|#####8 | 65/111 [00:42<00:28, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9564, LAS: 0.9217, UEM: 0.6083, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3418, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5789, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 62%|######2 | 69/111 [00:44<00:26, 1.58it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9572, LAS: 0.9223, UEM: 0.6156, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4749, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 
0.6363, loss: 0.5745, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 66%|######5 | 73/111 [00:47<00:25, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9575, LAS: 0.9226, UEM: 0.6203, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1145, partial_loss/deprel_loss: 0.2285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3701, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 69%|######9 | 77/111 [00:50<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9575, LAS: 0.9225, UEM: 0.6175, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5904, partial_loss/deprel_loss: 0.4982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.5731, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 73%|#######2 | 81/111 [00:53<00:21, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9576, LAS: 0.9226, UEM: 0.6186, LEM: 0.3954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 76%|#######5 | 84/111 [00:56<00:19, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9580, LAS: 0.9229, UEM: 0.6180, LEM: 0.3933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.5701, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 78%|#######8 | 87/111 [00:58<00:17, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 
0.9444, UAS: 0.9583, LAS: 0.9233, UEM: 0.6233, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1383, partial_loss/deprel_loss: 0.2481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3905, loss: 0.5673, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 81%|########1 | 90/111 [01:00<00:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9585, LAS: 0.9235, UEM: 0.6321, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6720, loss: 0.5650, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||: 84%|########3 | 93/111 [01:02<00:13, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9585, LAS: 0.9234, UEM: 0.6279, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3920, partial_loss/deprel_loss: 0.4626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6129, loss: 0.5658, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 86%|########6 | 96/111 [01:05<00:11, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9586, LAS: 0.9236, UEM: 0.6319, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6267, partial_loss/deprel_loss: 0.4552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.5635, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 89%|########9 | 99/111 [01:07<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9239, UEM: 0.6369, LEM: 0.4143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3991, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5936, loss: 0.5613, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 92%|#########1| 102/111 [01:09<00:06, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9594, LAS: 0.9242, UEM: 0.6422, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3173, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5157, loss: 0.5582, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 95%|#########4| 105/111 [01:12<00:04, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9597, LAS: 0.9245, UEM: 0.6444, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1521, partial_loss/deprel_loss: 0.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3741, loss: 0.5558, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 97%|#########7| 108/111 [01:14<00:02, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-07 01:21:01,093 - INFO - allennlp.training.trainer - Validating\n", 
+ " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9641, LAS: 0.9129, UEM: 0.7128, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 25.4464, partial_loss/cycle_loss: 0.0000, batch_loss: 20.4318, loss: 19.6309, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:11, 1.04s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9636, LAS: 0.9138, UEM: 0.7601, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1781, partial_loss/deprel_loss: 18.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 14.5213, loss: 19.2017, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:04<00:08, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9509, LAS: 0.9007, UEM: 0.7007, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1098, partial_loss/deprel_loss: 41.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2512, loss: 23.2837, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:08<00:05, 1.02s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9466, LAS: 0.8952, UEM: 0.6532, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3394, partial_loss/deprel_loss: 45.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 36.9685, loss: 25.1615, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 77%|#######6 | 10/13 [00:10<00:03, 1.01s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, 
EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - patience | 6.000 | N/A\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.342 | 29.679\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.280 | 0.896\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - reg_loss | 0.164 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - 
combo.training.tensorboard_writer - UEM | 0.646 | 0.658\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | 0.897\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - loss | 0.556 | 24.636\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEM | 0.419 | 0.397\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | 0.948\n", + "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - EM | 0.934 | 0.881\n", + "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:21:13,728 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:21:18,618 - INFO - combo.training.trainer - Epoch duration: 0:01:37.029658\n", + "2023-04-07 01:21:18,619 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:30\n", + "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Epoch 111/399\n", + "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:21:18,627 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9556, LAS: 0.9218, UEM: 0.4730, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.2881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5829, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||: 4%|3 | 4/111 [00:02<01:09, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9574, LAS: 0.9235, UEM: 0.4780, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.3992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5757, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||: 7%|7 | 8/111 [00:04<01:03, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9598, LAS: 0.9249, UEM: 0.5409, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2755, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5598, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||: 12%|#1 | 13/111 
[00:06<00:55, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9620, LAS: 0.9272, UEM: 0.6094, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1368, partial_loss/deprel_loss: 0.2402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3838, loss: 0.5370, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||: 16%|#6 | 18/111 [00:09<00:48, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9626, LAS: 0.9280, UEM: 0.6157, LEM: 0.3911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5523, loss: 0.5314, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||: 20%|#9 | 22/111 [00:11<00:46, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9647, LAS: 0.9304, UEM: 0.6799, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.3935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5494, loss: 0.5178, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||: 23%|##3 | 26/111 [00:14<00:49, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9639, LAS: 0.9299, UEM: 0.6849, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4031, loss: 0.5199, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||: 27%|##7 | 30/111 [00:17<00:53, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9635, LAS: 0.9297, UEM: 0.7096, LEM: 0.5093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5201, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 30%|##9 | 33/111 [00:19<00:54, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9603, LAS: 0.9262, UEM: 0.6885, LEM: 0.4912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6263, partial_loss/deprel_loss: 0.5303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5447, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 33%|###3 | 37/111 [00:22<00:49, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9603, LAS: 0.9262, UEM: 0.6803, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5469, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 37%|###6 | 41/111 [00:24<00:44, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9592, LAS: 0.9249, UEM: 0.6709, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.5541, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 41%|#### | 45/111 [00:27<00:43, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9580, LAS: 0.9238, UEM: 0.6687, LEM: 0.4696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8114, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6917, loss: 0.5602, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 44%|####4 | 49/111 [00:30<00:41, 1.50it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9581, LAS: 0.9238, UEM: 0.6645, LEM: 0.4654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5992, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6140, loss: 0.5593, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||: 48%|####7 | 53/111 [00:33<00:40, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9246, UEM: 0.6702, LEM: 0.4658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.5533, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 50%|##### | 56/111 [00:35<00:40, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9589, LAS: 0.9245, UEM: 0.6632, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6511, loss: 0.5547, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 53%|#####3 | 59/111 [00:37<00:37, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9591, LAS: 0.9245, UEM: 0.6607, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3761, partial_loss/deprel_loss: 0.4201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5754, loss: 0.5543, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 56%|#####5 | 62/111 [00:39<00:35, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9596, LAS: 0.9248, UEM: 0.6674, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4760, loss: 0.5503, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 59%|#####8 | 65/111 [00:41<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9597, LAS: 0.9248, UEM: 0.6682, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1707, partial_loss/deprel_loss: 0.2553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4025, loss: 0.5495, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 61%|######1 | 68/111 [00:44<00:31, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9599, LAS: 0.9250, UEM: 0.6684, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.2533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4004, loss: 0.5474, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 64%|######3 | 71/111 [00:46<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9600, LAS: 0.9251, UEM: 0.6631, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.5473, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 68%|######7 | 75/111 [00:48<00:24, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9592, LAS: 0.9241, UEM: 0.6583, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.5534, batch_reg_loss: 
0.1641, reg_loss: 0.1642 ||: 70%|####### | 78/111 [00:51<00:23, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9593, LAS: 0.9240, UEM: 0.6555, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.4539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.5546, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 73%|#######2 | 81/111 [00:53<00:21, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9593, LAS: 0.9240, UEM: 0.6541, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.2648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.5554, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 76%|#######5 | 84/111 [00:55<00:19, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9591, LAS: 0.9238, UEM: 0.6509, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.2569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5566, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 78%|#######8 | 87/111 [00:57<00:17, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9241, UEM: 0.6525, LEM: 0.4357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2041, partial_loss/deprel_loss: 0.2996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.5538, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||: 81%|########1 | 90/111 [00:59<00:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9597, LAS: 0.9243, UEM: 
0.6539, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.5519, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||: 85%|########4 | 94/111 [01:02<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9600, LAS: 0.9247, UEM: 0.6560, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5495, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||: 87%|########7 | 97/111 [01:04<00:09, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9596, LAS: 0.9243, UEM: 0.6499, LEM: 0.4312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4719, loss: 0.5512, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||: 91%|######### | 101/111 [01:09<00:08, 1.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9594, LAS: 0.9240, UEM: 0.6432, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4741, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.5547, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||: 95%|#########4| 105/111 [01:12<00:04, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9597, LAS: 0.9244, UEM: 0.6477, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2616, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5086, loss: 0.5519, 
batch_reg_loss: 0.1640, reg_loss: 0.1641 ||: 97%|#########7| 108/111 [01:14<00:02, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9595, LAS: 0.9241, UEM: 0.6436, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3721, partial_loss/deprel_loss: 0.3770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5400, loss: 0.5536, batch_reg_loss: 0.1640, reg_loss: 0.1641 ||: 100%|##########| 111/111 [01:16<00:00, 1.45it/s]\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.377 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.372 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - reg_loss | 0.164 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UEM | 0.644 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LAS | 0.924 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - 
combo.training.tensorboard_writer - loss | 0.554 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEM | 0.423 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UAS | 0.959 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EM | 0.922 | N/A\n", + "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:22:38,121 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:22:45,590 - INFO - combo.training.trainer - Epoch duration: 0:01:26.971396\n", + "2023-04-07 01:22:45,591 - INFO - combo.training.trainer - Estimated training time remaining: 6:33:21\n", + "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Epoch 112/399\n", + "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:22:45,592 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:22:45,602 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9465, LAS: 0.9113, UEM: 0.3516, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9347, partial_loss/deprel_loss: 0.5649, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.8029, loss: 0.6429, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 3%|2 | 3/111 [00:02<01:18, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9502, LAS: 0.9139, UEM: 0.4979, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7445, loss: 0.6125, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 5%|5 | 6/111 [00:04<01:16, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9543, LAS: 0.9171, UEM: 0.5289, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2015, partial_loss/deprel_loss: 0.3542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.5984, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 9%|9 | 10/111 [00:06<01:10, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9520, LAS: 0.9153, UEM: 0.4784, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6202, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 13%|#2 | 14/111 [00:09<01:06, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9533, LAS: 0.9172, UEM: 0.5065, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1862, partial_loss/deprel_loss: 0.3066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4465, loss: 0.6082, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 16%|#6 | 18/111 [00:12<01:03, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9527, LAS: 
0.9165, UEM: 0.5070, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8457, partial_loss/deprel_loss: 0.5729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7914, loss: 0.6121, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||: 19%|#8 | 21/111 [00:14<01:04, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9537, LAS: 0.9181, UEM: 0.5409, LEM: 0.3272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3244, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.6005, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 22%|##1 | 24/111 [00:16<01:03, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9403, UAS: 0.9540, LAS: 0.9189, UEM: 0.5440, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5944, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 24%|##4 | 27/111 [00:19<01:01, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9564, LAS: 0.9210, UEM: 0.5942, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.2766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5804, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 27%|##7 | 30/111 [00:21<00:58, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9571, LAS: 0.9218, UEM: 0.6062, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6015, loss: 0.5729, batch_reg_loss: 
0.1639, reg_loss: 0.1640 ||: 30%|##9 | 33/111 [00:23<00:56, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9579, LAS: 0.9227, UEM: 0.6108, LEM: 0.3877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.5635, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 33%|###3 | 37/111 [00:25<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9576, LAS: 0.9225, UEM: 0.6093, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7147, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.5641, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 36%|###6 | 40/111 [00:28<00:52, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9577, LAS: 0.9223, UEM: 0.6054, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5653, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||: 39%|###8 | 43/111 [00:30<00:49, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9583, LAS: 0.9233, UEM: 0.6294, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0886, partial_loss/deprel_loss: 0.1720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3192, loss: 0.5584, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||: 41%|####1 | 46/111 [00:32<00:47, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9586, LAS: 0.9236, UEM: 0.6407, LEM: 0.4244, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3458, loss: 0.5557, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||: 45%|####5 | 50/111 [00:35<00:43, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9588, LAS: 0.9235, UEM: 0.6325, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.5578, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||: 49%|####8 | 54/111 [00:37<00:38, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9588, LAS: 0.9236, UEM: 0.6321, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1250, partial_loss/deprel_loss: 0.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3891, loss: 0.5572, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||: 51%|#####1 | 57/111 [00:39<00:36, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9582, LAS: 0.9231, UEM: 0.6267, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2787, partial_loss/deprel_loss: 0.2862, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4485, loss: 0.5608, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 55%|#####4 | 61/111 [00:42<00:33, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9581, LAS: 0.9230, UEM: 0.6202, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5998, loss: 0.5626, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 59%|#####8 | 65/111 [00:45<00:30, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9577, LAS: 0.9226, UEM: 0.6181, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5654, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 61%|######1 | 68/111 [00:47<00:29, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9583, LAS: 0.9231, UEM: 0.6201, LEM: 0.3982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 64%|######3 | 71/111 [00:49<00:27, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9581, LAS: 0.9230, UEM: 0.6127, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4975, partial_loss/deprel_loss: 0.4292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6067, loss: 0.5656, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 67%|######6 | 74/111 [00:51<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9583, LAS: 0.9234, UEM: 0.6134, LEM: 0.3913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 70%|####### | 78/111 [00:54<00:22, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9441, UAS: 0.9589, LAS: 0.9240, UEM: 0.6244, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1680, partial_loss/deprel_loss: 0.2197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3732, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 73%|#######2 | 81/111 [00:56<00:20, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9588, LAS: 0.9238, UEM: 0.6206, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2257, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 77%|#######6 | 85/111 [00:59<00:18, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9595, LAS: 0.9246, UEM: 0.6336, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.3525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.5523, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 80%|######## | 89/111 [01:01<00:14, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9602, LAS: 0.9254, UEM: 0.6529, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1587, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.5475, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 84%|########3 | 93/111 [01:05<00:13, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9599, LAS: 0.9252, UEM: 0.6513, LEM: 0.4335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1936, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4236, loss: 0.5494, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||: 86%|########6 | 96/111 [01:07<00:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9597, LAS: 0.9249, UEM: 0.6490, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2162, partial_loss/deprel_loss: 0.3828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.5507, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 90%|######### | 100/111 [01:09<00:07, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9595, LAS: 0.9246, UEM: 0.6438, LEM: 0.4233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.5532, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 95%|#########4| 105/111 [01:11<00:03, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9597, LAS: 0.9248, UEM: 0.6440, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5283, loss: 0.5515, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 99%|#########9| 110/111 [01:13<00:00, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9597, LAS: 0.9249, UEM: 0.6435, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4962, loss: 0.5510, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 01:24:02,965 - INFO - combo.training.tensorboard_writer - Training 
| Validation\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.345 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.282 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - reg_loss | 0.164 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UEM | 0.644 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - LAS | 0.925 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - loss | 0.551 | N/A\n", + "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEM | 0.423 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 
0.000 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EM | 0.931 | N/A\n", + "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:24:02,972 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:24:08,115 - INFO - combo.training.trainer - Epoch duration: 0:01:22.524054\n", + "2023-04-07 01:24:08,116 - INFO - combo.training.trainer - Estimated training time remaining: 6:32:00\n", + "2023-04-07 01:24:08,116 - INFO - allennlp.training.trainer - Epoch 113/399\n", + "2023-04-07 01:24:08,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:24:08,120 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:24:08,127 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9435, LAS: 0.9077, UEM: 0.5920, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4211, loss: 0.6665, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 3%|2 | 3/111 [00:02<01:18, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9525, LAS: 0.9181, UEM: 0.6117, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.3963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.5999, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 5%|5 | 6/111 [00:04<01:14, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9380, UAS: 0.9566, LAS: 0.9209, UEM: 0.6403, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1369, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5777, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 8%|8 | 9/111 [00:06<01:12, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9597, LAS: 0.9256, UEM: 0.6848, LEM: 0.4760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0767, partial_loss/deprel_loss: 0.1787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3220, loss: 0.5496, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 11%|# | 12/111 [00:08<01:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9600, LAS: 0.9256, UEM: 0.6684, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.5426, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 14%|#3 | 15/111 [00:10<01:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9572, LAS: 0.9225, UEM: 0.6189, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7275, loss: 0.5690, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 17%|#7 | 19/111 [00:13<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9574, LAS: 0.9231, UEM: 0.6233, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, 
loss: 0.5615, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||: 21%|## | 23/111 [00:15<00:57, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9573, LAS: 0.9233, UEM: 0.6406, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0529, partial_loss/deprel_loss: 0.5422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 0.5586, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 24%|##4 | 27/111 [00:18<00:54, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9564, LAS: 0.9221, UEM: 0.6399, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5640, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 27%|##7 | 30/111 [00:20<00:54, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9571, LAS: 0.9223, UEM: 0.6434, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 0.2758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4173, loss: 0.5608, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 30%|##9 | 33/111 [00:22<00:52, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9564, LAS: 0.9217, UEM: 0.6241, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6261, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5668, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 32%|###2 | 36/111 [00:24<00:51, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9566, LAS: 0.9218, 
UEM: 0.6162, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3270, partial_loss/deprel_loss: 0.3358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4977, loss: 0.5653, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 35%|###5 | 39/111 [00:26<00:50, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9567, LAS: 0.9220, UEM: 0.6088, LEM: 0.3970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6791, partial_loss/deprel_loss: 0.4889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6906, loss: 0.5671, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 38%|###7 | 42/111 [00:28<00:49, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9564, LAS: 0.9216, UEM: 0.6039, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5713, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 41%|####1 | 46/111 [00:31<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9572, LAS: 0.9224, UEM: 0.6089, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.4346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.5652, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||: 45%|####5 | 50/111 [00:34<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9569, LAS: 0.9224, UEM: 0.6093, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7306, partial_loss/deprel_loss: 0.5466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7470, loss: 0.5666, batch_reg_loss: 
0.1636, reg_loss: 0.1636 ||: 49%|####8 | 54/111 [00:36<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9574, LAS: 0.9229, UEM: 0.6208, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6644, loss: 0.5625, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9579, LAS: 0.9234, UEM: 0.6257, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.5590, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||: 54%|#####4 | 60/111 [00:41<00:35, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9586, LAS: 0.9242, UEM: 0.6372, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3923, loss: 0.5533, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||: 57%|#####6 | 63/111 [00:43<00:36, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9583, LAS: 0.9240, UEM: 0.6283, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5295, loss: 0.5554, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 60%|###### | 67/111 [00:46<00:31, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9595, LAS: 0.9252, UEM: 0.6533, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3758, loss: 0.5470, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 63%|######3 | 70/111 [00:48<00:28, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9599, LAS: 0.9257, UEM: 0.6554, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1910, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 66%|######5 | 73/111 [00:50<00:28, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9596, LAS: 0.9254, UEM: 0.6500, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5300, loss: 0.5468, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 69%|######9 | 77/111 [00:53<00:24, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9601, LAS: 0.9257, UEM: 0.6518, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1751, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 73%|#######2 | 81/111 [00:55<00:19, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9595, LAS: 0.9250, UEM: 0.6442, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8791, partial_loss/deprel_loss: 0.5936, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.8142, loss: 0.5483, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 77%|#######7 | 86/111 [00:57<00:14, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9598, LAS: 0.9254, UEM: 0.6547, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.5463, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 81%|########1 | 90/111 [01:00<00:13, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9604, LAS: 0.9259, UEM: 0.6577, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.5433, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||: 85%|########4 | 94/111 [01:02<00:10, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9602, LAS: 0.9256, UEM: 0.6506, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4410, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.5457, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 88%|########8 | 98/111 [01:05<00:07, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9604, LAS: 0.9258, UEM: 0.6540, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5434, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 92%|#########1| 102/111 [01:07<00:05, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9605, LAS: 0.9260, UEM: 0.6514, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3090, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4792, loss: 0.5419, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 96%|#########6| 107/111 [01:10<00:02, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9601, LAS: 0.9256, UEM: 0.6451, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4750, partial_loss/deprel_loss: 0.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6263, loss: 0.5441, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 100%|##########| 111/111 [01:12<00:00, 1.54it/s]\n", + "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.460 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.475 | N/A\n", + "2023-04-07 01:25:23,465 - 
INFO - combo.training.tensorboard_writer - reg_loss | 0.164 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UEM | 0.645 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - loss | 0.544 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEM | 0.427 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UAS | 0.960 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EM | 0.915 | N/A\n", + "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:25:23,472 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Epoch duration: 0:01:20.340225\n", + "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Estimated training time remaining: 6:30:34\n", + "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Epoch 114/399\n", + "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:25:28,466 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9547, LAS: 0.9186, UEM: 0.4273, LEM: 0.1939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.4807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6056, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||: 3%|2 | 3/111 [00:02<01:21, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9578, LAS: 0.9234, UEM: 0.4774, LEM: 0.2359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5772, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||: 5%|5 | 6/111 [00:04<01:18, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9633, LAS: 0.9302, UEM: 0.5858, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.5286, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||: 9%|9 | 10/111 
[00:06<01:11, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9626, LAS: 0.9286, UEM: 0.6194, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5775, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6829, loss: 0.5309, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||: 13%|#2 | 14/111 [00:09<01:05, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9637, LAS: 0.9305, UEM: 0.6935, LEM: 0.4949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4562, loss: 0.5180, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||: 15%|#5 | 17/111 [00:11<01:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9644, LAS: 0.9308, UEM: 0.6832, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3690, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5159, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 19%|#8 | 21/111 [00:14<01:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9633, LAS: 0.9294, UEM: 0.6628, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6813, partial_loss/deprel_loss: 0.5702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.5264, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 22%|##1 | 24/111 [00:16<01:00, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9644, LAS: 0.9303, UEM: 0.6832, LEM: 0.4702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.0925, partial_loss/deprel_loss: 0.2237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3608, loss: 0.5173, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 24%|##4 | 27/111 [00:18<00:58, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9624, LAS: 0.9282, UEM: 0.6623, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4599, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6204, loss: 0.5314, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 27%|##7 | 30/111 [00:20<00:56, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9620, LAS: 0.9284, UEM: 0.6473, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.4161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.5333, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 31%|### | 34/111 [00:23<00:51, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9632, LAS: 0.9297, UEM: 0.6585, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.5242, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||: 34%|###4 | 38/111 [00:25<00:48, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9289, UEM: 0.6467, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4360, loss: 0.5306, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||: 38%|###7 | 42/111 [00:28<00:46, 1.47it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9616, LAS: 0.9279, UEM: 0.6359, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7707, partial_loss/deprel_loss: 0.5840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.5386, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||: 41%|#### | 45/111 [00:30<00:47, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9620, LAS: 0.9282, UEM: 0.6325, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2114, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5358, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||: 43%|####3 | 48/111 [00:33<00:45, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9617, LAS: 0.9280, UEM: 0.6243, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.5381, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||: 46%|####5 | 51/111 [00:35<00:44, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9617, LAS: 0.9280, UEM: 0.6325, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3666, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5340, loss: 0.5358, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 49%|####8 | 54/111 [00:37<00:41, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9615, LAS: 0.9277, UEM: 0.6346, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9003, partial_loss/deprel_loss: 0.5767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.5368, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 51%|#####1 | 57/111 [00:39<00:39, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9606, LAS: 0.9267, UEM: 0.6277, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8944, loss: 0.5447, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 54%|#####4 | 60/111 [00:42<00:37, 1.35it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9609, LAS: 0.9269, UEM: 0.6307, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4027, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.5431, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 57%|#####6 | 63/111 [00:44<00:36, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9607, LAS: 0.9267, UEM: 0.6229, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.5432, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 60%|###### | 67/111 [00:46<00:31, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9613, LAS: 0.9271, UEM: 0.6294, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1762, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4539, loss: 0.5403, batch_reg_loss: 0.1632, 
reg_loss: 0.1633 ||: 63%|######3 | 70/111 [00:49<00:29, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9609, LAS: 0.9267, UEM: 0.6307, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5436, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 66%|######5 | 73/111 [00:51<00:26, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9613, LAS: 0.9272, UEM: 0.6381, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2478, partial_loss/deprel_loss: 0.3511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.5398, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 68%|######8 | 76/111 [00:53<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9614, LAS: 0.9272, UEM: 0.6402, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.4691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.5406, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 72%|#######2 | 80/111 [00:55<00:20, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9616, LAS: 0.9273, UEM: 0.6387, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5391, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 76%|#######5 | 84/111 [00:57<00:17, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9616, LAS: 0.9271, UEM: 0.6359, 
LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6056, partial_loss/deprel_loss: 0.4984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.5388, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 80%|######## | 89/111 [01:00<00:13, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9613, LAS: 0.9268, UEM: 0.6340, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3948, loss: 0.5409, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||: 85%|########4 | 94/111 [01:02<00:09, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9607, LAS: 0.9261, UEM: 0.6273, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4857, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.5446, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 89%|########9 | 99/111 [01:05<00:06, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9608, LAS: 0.9263, UEM: 0.6391, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 0.5438, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 93%|#########2| 103/111 [01:07<00:04, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9606, LAS: 0.9262, UEM: 0.6421, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3545, partial_loss/deprel_loss: 0.4660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.5446, 
batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 96%|#########6| 107/111 [01:10<00:02, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.265 | 
N/A\n", + "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.228 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - reg_loss | 0.163 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UEM | 0.646 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - loss | 0.542 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEM | 0.423 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EM | 0.937 | N/A\n", + "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:26:44,764 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Epoch duration: 0:01:21.342111\n", + "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Estimated training time remaining: 6:29:11\n", + "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Epoch 115/399\n", + "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:26:49,800 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:26:49,811 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9547, LAS: 0.9173, UEM: 0.3925, LEM: 0.1752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3871, partial_loss/deprel_loss: 0.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.5949, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 4%|3 | 4/111 [00:02<01:03, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9608, LAS: 0.9239, UEM: 0.6031, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3876, loss: 0.5477, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 6%|6 | 7/111 [00:04<01:06, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9610, LAS: 0.9251, UEM: 0.6085, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.3027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4560, loss: 0.5365, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 9%|9 | 10/111 
[00:06<01:05, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9606, LAS: 0.9248, UEM: 0.5913, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5387, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 13%|#2 | 14/111 [00:09<01:02, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9561, LAS: 0.9205, UEM: 0.5787, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 0.5953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8343, loss: 0.5763, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 16%|#6 | 18/111 [00:11<01:00, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9571, LAS: 0.9214, UEM: 0.5802, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4454, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5991, loss: 0.5686, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||: 19%|#8 | 21/111 [00:13<00:59, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9558, LAS: 0.9203, UEM: 0.5699, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.5225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7381, loss: 0.5809, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 23%|##2 | 25/111 [00:16<00:54, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9560, LAS: 0.9204, UEM: 0.5712, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7270, loss: 0.5789, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 26%|##6 | 29/111 [00:18<00:52, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9562, LAS: 0.9205, UEM: 0.5662, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4325, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5776, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 29%|##8 | 32/111 [00:20<00:51, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9567, LAS: 0.9210, UEM: 0.5642, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5532, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.5761, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 32%|###2 | 36/111 [00:23<00:48, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9577, LAS: 0.9227, UEM: 0.5645, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4949, loss: 0.5676, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 36%|###6 | 40/111 [00:25<00:44, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9593, LAS: 0.9242, UEM: 0.6023, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.2403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3885, loss: 0.5565, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||: 40%|###9 | 44/111 [00:28<00:42, 1.57it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9598, LAS: 0.9247, UEM: 0.6098, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1807, partial_loss/deprel_loss: 0.3618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5529, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||: 43%|####3 | 48/111 [00:30<00:39, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9600, LAS: 0.9249, UEM: 0.6152, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8968, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5531, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||: 47%|####6 | 52/111 [00:33<00:38, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9760, UAS: 0.9603, LAS: 0.9255, UEM: 0.6436, LEM: 0.4230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0247, partial_loss/deprel_loss: 0.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2363, loss: 0.5484, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||: 50%|##### | 56/111 [00:37<00:40, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9613, LAS: 0.9268, UEM: 0.6714, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0662, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2913, loss: 0.5381, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||: 53%|#####3 | 59/111 [00:39<00:40, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9611, LAS: 0.9266, UEM: 0.6727, LEM: 0.4602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1327, partial_loss/deprel_loss: 0.2068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3549, loss: 0.5380, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 57%|#####6 | 63/111 [00:42<00:37, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9608, LAS: 0.9264, UEM: 0.6661, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5401, loss: 0.5396, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 59%|#####9 | 66/111 [00:45<00:33, 1.33it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9610, LAS: 0.9265, UEM: 0.6630, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1927, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.5398, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 64%|######3 | 71/111 [00:47<00:26, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9604, LAS: 0.9259, UEM: 0.6528, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7439, partial_loss/deprel_loss: 0.5034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7144, loss: 0.5445, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 68%|######8 | 76/111 [00:49<00:21, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9600, LAS: 0.9254, UEM: 0.6427, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6552, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.5482, batch_reg_loss: 
0.1629, reg_loss: 0.1630 ||: 73%|#######2 | 81/111 [00:52<00:17, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9605, LAS: 0.9259, UEM: 0.6488, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4177, loss: 0.5444, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 77%|#######6 | 85/111 [00:54<00:14, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9603, LAS: 0.9255, UEM: 0.6422, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4813, loss: 0.5465, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 80%|######## | 89/111 [00:57<00:13, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9602, LAS: 0.9253, UEM: 0.6407, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5308, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6338, loss: 0.5477, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 84%|########3 | 93/111 [01:00<00:12, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9604, LAS: 0.9255, UEM: 0.6448, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1062, partial_loss/deprel_loss: 0.2317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.5461, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||: 87%|########7 | 97/111 [01:03<00:09, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9604, LAS: 0.9255, 
UEM: 0.6440, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7574, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7189, loss: 0.5467, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 91%|######### | 101/111 [01:06<00:06, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9607, LAS: 0.9259, UEM: 0.6425, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5342, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 95%|#########4| 105/111 [01:09<00:04, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9607, LAS: 0.9259, UEM: 0.6409, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4736, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 98%|#########8| 109/111 [01:11<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9610, LAS: 0.9262, UEM: 0.6476, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0943, partial_loss/deprel_loss: 0.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3463, loss: 0.5421, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 100%|##########| 111/111 [01:13<00:00, 1.52it/s]\n", + "2023-04-07 01:28:05,803 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9357, LAS: 0.8788, UEM: 0.3387, LEM: 0.0753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.9730, partial_loss/deprel_loss: 35.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 28.5853, loss: 31.0780, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:12, 1.09s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9552, LAS: 0.9039, UEM: 0.6997, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 22.8051, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2725, loss: 25.2398, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 31%|### | 4/13 [00:04<00:09, 1.09s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9505, LAS: 0.9004, UEM: 0.6364, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7520, partial_loss/deprel_loss: 28.9441, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3056, loss: 25.0064, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 54%|#####3 | 7/13 [00:07<00:06, 1.04s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9546, LAS: 0.9063, UEM: 0.7099, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5701, partial_loss/deprel_loss: 23.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9172, loss: 23.1846, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:09<00:04, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9528, LAS: 0.9035, UEM: 0.6763, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7413, partial_loss/deprel_loss: 33.2838, partial_loss/cycle_loss: 0.0000, batch_loss: 26.7753, loss: 23.2175, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 92%|#########2| 12/13 [00:11<00:00, 
1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9483, LAS: 0.8987, UEM: 0.6599, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6642, partial_loss/deprel_loss: 54.1649, partial_loss/cycle_loss: 0.0000, batch_loss: 43.6647, loss: 24.7903, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.00it/s]\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - patience | 5.000 | N/A\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.206 | 54.165\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.094 | 1.664\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - reg_loss | 0.163 | 0.000\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UEM | 0.648 | 0.660\n", + "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - LAS | 0.926 | 0.899\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - loss | 0.542 | 24.790\n", + 
"2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEM | 0.431 | 0.396\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | 0.948\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EM | 0.949 | 0.841\n", + "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:28:18,783 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:28:23,018 - INFO - combo.training.trainer - Epoch duration: 0:01:33.219014\n", + "2023-04-07 01:28:23,019 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:17\n", + "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Epoch 116/399\n", + "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:28:23,020 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:28:23,029 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9574, LAS: 0.9219, UEM: 0.5537, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5787, batch_reg_loss: 0.1628, 
reg_loss: 0.1628 ||: 4%|3 | 4/111 [00:02<01:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9581, LAS: 0.9241, UEM: 0.5307, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6387, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6399, loss: 0.5651, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 7%|7 | 8/111 [00:05<01:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9591, LAS: 0.9241, UEM: 0.5168, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4099, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.5604, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 10%|9 | 11/111 [00:07<01:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9567, LAS: 0.9219, UEM: 0.5284, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.5698, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 13%|#2 | 14/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9564, LAS: 0.9219, UEM: 0.5200, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3841, partial_loss/deprel_loss: 0.3641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5309, loss: 0.5723, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 15%|#5 | 17/111 [00:11<01:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9589, LAS: 0.9248, UEM: 0.6190, LEM: 0.4255, EUAS: 0.0000, ELAS: 
0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5315, loss: 0.5545, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 18%|#8 | 20/111 [00:14<01:06, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9577, LAS: 0.9236, UEM: 0.6216, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5082, partial_loss/deprel_loss: 0.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6282, loss: 0.5616, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||: 21%|## | 23/111 [00:16<01:07, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9595, LAS: 0.9256, UEM: 0.6471, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1424, partial_loss/deprel_loss: 0.2302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3754, loss: 0.5457, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||: 23%|##3 | 26/111 [00:19<01:07, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9588, LAS: 0.9249, UEM: 0.6298, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3933, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5796, loss: 0.5488, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||: 26%|##6 | 29/111 [00:21<01:02, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9606, LAS: 0.9268, UEM: 0.6540, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3722, partial_loss/deprel_loss: 0.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4956, loss: 0.5388, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||: 30%|##9 | 33/111 
[00:23<00:54, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9612, LAS: 0.9271, UEM: 0.6495, LEM: 0.4434, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1959, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.5359, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||: 34%|###4 | 38/111 [00:26<00:47, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9500, UAS: 0.9614, LAS: 0.9273, UEM: 0.6543, LEM: 0.4509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1142, partial_loss/deprel_loss: 0.1998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3453, loss: 0.5354, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||: 39%|###8 | 43/111 [00:28<00:40, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9616, LAS: 0.9277, UEM: 0.6489, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2601, partial_loss/deprel_loss: 0.3257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4753, loss: 0.5345, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||: 43%|####3 | 48/111 [00:31<00:35, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9621, LAS: 0.9282, UEM: 0.6544, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1851, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5299, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||: 47%|####6 | 52/111 [00:33<00:35, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9624, LAS: 0.9282, UEM: 0.6494, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.3444, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.5285, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||: 50%|##### | 56/111 [00:36<00:35, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9284, UEM: 0.6518, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2388, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5269, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 54%|#####4 | 60/111 [00:40<00:36, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9629, LAS: 0.9288, UEM: 0.6697, LEM: 0.4579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0658, partial_loss/deprel_loss: 0.1754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3161, loss: 0.5245, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 58%|#####7 | 64/111 [00:43<00:33, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9629, LAS: 0.9286, UEM: 0.6671, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4276, loss: 0.5241, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 61%|######1 | 68/111 [00:45<00:29, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9630, LAS: 0.9289, UEM: 0.6664, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5225, 
batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 65%|######4 | 72/111 [00:48<00:25, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9620, LAS: 0.9276, UEM: 0.6565, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6533, loss: 0.5320, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 68%|######8 | 76/111 [00:50<00:23, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9617, LAS: 0.9273, UEM: 0.6535, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8500, partial_loss/deprel_loss: 0.5179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7469, loss: 0.5336, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 72%|#######2 | 80/111 [00:53<00:20, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9613, LAS: 0.9271, UEM: 0.6508, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5955, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5355, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 76%|#######5 | 84/111 [00:56<00:18, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9606, LAS: 0.9264, UEM: 0.6449, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3222, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5414, loss: 0.5413, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 79%|#######9 | 88/111 [00:58<00:15, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9608, LAS: 
0.9267, UEM: 0.6465, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.5395, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 83%|########2 | 92/111 [01:01<00:12, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9609, LAS: 0.9267, UEM: 0.6496, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7109, partial_loss/deprel_loss: 0.4976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7028, loss: 0.5385, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||: 86%|########6 | 96/111 [01:04<00:10, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9610, LAS: 0.9268, UEM: 0.6488, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6543, partial_loss/deprel_loss: 0.4789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6765, loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 90%|######### | 100/111 [01:06<00:07, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9608, LAS: 0.9266, UEM: 0.6439, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2691, partial_loss/deprel_loss: 0.3528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4986, loss: 0.5396, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 93%|#########2| 103/111 [01:08<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9610, LAS: 0.9268, UEM: 0.6465, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1619, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, 
loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 96%|#########6| 107/111 [01:11<00:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9608, LAS: 0.9265, UEM: 0.6469, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1204, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5391, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 99%|#########9| 110/111 [01:13<00:00, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9609, LAS: 0.9266, UEM: 0.6485, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4372, loss: 0.5382, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 
0.293 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.202 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - reg_loss | 0.163 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UEM | 0.649 | N/A\n", + "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - loss | 0.538 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEM | 0.431 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - EM | 0.938 | N/A\n", + "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:29:40,447 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Epoch duration: 0:01:22.264978\n", + "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:26:55\n", + "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Epoch 117/399\n", + "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:29:45,286 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:29:45,297 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9410, LAS: 0.9072, UEM: 0.2115, LEM: 0.0673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0066, partial_loss/deprel_loss: 0.4922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7576, loss: 0.6695, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 3%|2 | 3/111 [00:02<01:16, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9573, LAS: 0.9234, UEM: 0.6225, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5587, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 5%|5 | 6/111 [00:04<01:13, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9597, LAS: 0.9265, UEM: 0.6303, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.2943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.5306, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 9%|9 | 10/111 
[00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9618, LAS: 0.9290, UEM: 0.6422, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3256, partial_loss/deprel_loss: 0.3279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4899, loss: 0.5178, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 13%|#2 | 14/111 [00:09<01:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9631, LAS: 0.9301, UEM: 0.6359, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.3239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4711, loss: 0.5122, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 16%|#6 | 18/111 [00:11<00:57, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9630, LAS: 0.9298, UEM: 0.6229, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3032, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.5102, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||: 21%|## | 23/111 [00:13<00:50, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9634, LAS: 0.9309, UEM: 0.6398, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1709, partial_loss/deprel_loss: 0.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4053, loss: 0.5038, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||: 25%|##5 | 28/111 [00:15<00:43, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9632, LAS: 0.9309, UEM: 0.6331, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5536, loss: 0.5060, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||: 29%|##8 | 32/111 [00:17<00:41, 1.91it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9632, LAS: 0.9312, UEM: 0.6660, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0344, partial_loss/deprel_loss: 0.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2474, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||: 32%|###2 | 36/111 [00:21<00:46, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9313, UEM: 0.6693, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4329, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6159, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||: 36%|###6 | 40/111 [00:23<00:45, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9626, LAS: 0.9303, UEM: 0.6647, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6834, loss: 0.5078, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||: 40%|###9 | 44/111 [00:26<00:45, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9623, LAS: 0.9300, UEM: 0.6570, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5114, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||: 43%|####3 | 48/111 [00:29<00:42, 1.50it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9624, LAS: 0.9300, UEM: 0.6613, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5246, partial_loss/deprel_loss: 0.4793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6507, loss: 0.5130, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||: 47%|####6 | 52/111 [00:32<00:39, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9625, LAS: 0.9299, UEM: 0.6535, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3355, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5163, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||: 50%|##### | 56/111 [00:34<00:34, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9621, LAS: 0.9293, UEM: 0.6491, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1408, partial_loss/deprel_loss: 0.2545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5204, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||: 54%|#####4 | 60/111 [00:37<00:32, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9619, LAS: 0.9290, UEM: 0.6429, LEM: 0.4245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4904, loss: 0.5217, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 58%|#####7 | 64/111 [00:39<00:31, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9610, LAS: 0.9281, UEM: 0.6440, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 1.0708, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5269, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 61%|######1 | 68/111 [00:42<00:29, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9601, LAS: 0.9271, UEM: 0.6366, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.5337, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 64%|######3 | 71/111 [00:44<00:27, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9602, LAS: 0.9270, UEM: 0.6335, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5353, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 67%|######6 | 74/111 [00:47<00:26, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9603, LAS: 0.9271, UEM: 0.6388, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.4509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.5350, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 69%|######9 | 77/111 [00:49<00:24, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9606, LAS: 0.9274, UEM: 0.6483, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6415, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7376, loss: 0.5339, batch_reg_loss: 
0.1623, reg_loss: 0.1624 ||: 72%|#######2 | 80/111 [00:51<00:22, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9608, LAS: 0.9275, UEM: 0.6506, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5326, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 75%|#######4 | 83/111 [00:53<00:20, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9612, LAS: 0.9277, UEM: 0.6555, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2927, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4874, loss: 0.5298, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 78%|#######8 | 87/111 [00:56<00:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9611, LAS: 0.9276, UEM: 0.6540, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6455, partial_loss/deprel_loss: 0.5085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.5311, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 81%|########1 | 90/111 [00:58<00:15, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9606, LAS: 0.9271, UEM: 0.6474, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6479, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.5349, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 85%|########4 | 94/111 [01:01<00:11, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9608, LAS: 0.9273, 
UEM: 0.6451, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3137, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5164, loss: 0.5347, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 87%|########7 | 97/111 [01:03<00:09, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9607, LAS: 0.9271, UEM: 0.6447, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3215, partial_loss/deprel_loss: 0.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5683, loss: 0.5362, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 90%|######### | 100/111 [01:05<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9605, LAS: 0.9269, UEM: 0.6461, LEM: 0.4320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1824, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3796, loss: 0.5365, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 93%|#########2| 103/111 [01:07<00:05, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9608, LAS: 0.9272, UEM: 0.6491, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5345, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||: 95%|#########5| 106/111 [01:10<00:03, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9608, LAS: 0.9271, UEM: 0.6473, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4784, loss: 
0.5352, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||: 99%|#########9| 110/111 [01:12<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9608, LAS: 0.9271, UEM: 0.6470, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.3751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5351, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.375 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.320 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - reg_loss | 0.162 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UEM | 0.647 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - 
combo.training.tensorboard_writer - loss | 0.535 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEM | 0.430 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EM | 0.933 | N/A\n", + "2023-04-07 01:31:01,942 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:31:01,947 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:31:06,980 - INFO - combo.training.trainer - Epoch duration: 0:01:21.695775\n", + "2023-04-07 01:31:06,981 - INFO - combo.training.trainer - Estimated training time remaining: 6:25:32\n", + "2023-04-07 01:31:06,981 - INFO - allennlp.training.trainer - Epoch 118/399\n", + "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:31:06,992 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9584, LAS: 0.9244, UEM: 0.5742, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4591, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6352, loss: 0.5838, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 5%|4 | 5/111 [00:02<00:49, 2.13it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9661, LAS: 0.9330, UEM: 0.6756, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2489, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5024, loss: 0.5213, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 8%|8 | 9/111 [00:05<00:53, 1.89it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9642, LAS: 0.9312, UEM: 0.6472, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4661, loss: 0.5239, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 12%|#1 | 13/111 [00:07<00:54, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9629, LAS: 0.9304, UEM: 0.6386, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6097, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6417, loss: 0.5277, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 15%|#5 | 17/111 [00:10<00:55, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9627, LAS: 0.9306, UEM: 0.6374, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4281, partial_loss/deprel_loss: 0.3719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.5259, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 19%|#8 | 21/111 [00:12<00:54, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 
0.9302, UEM: 0.6381, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.4099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5824, loss: 0.5261, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 23%|##3 | 26/111 [00:15<00:47, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9630, LAS: 0.9303, UEM: 0.6479, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3967, loss: 0.5214, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||: 28%|##7 | 31/111 [00:17<00:42, 1.87it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9633, LAS: 0.9307, UEM: 0.6835, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9265, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8041, loss: 0.5189, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 32%|###1 | 35/111 [00:20<00:45, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9635, LAS: 0.9309, UEM: 0.6790, LEM: 0.4666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.5163, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 35%|###5 | 39/111 [00:23<00:48, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9644, LAS: 0.9317, UEM: 0.7036, LEM: 0.4959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0596, partial_loss/deprel_loss: 0.1671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3077, loss: 0.5090, 
batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 38%|###7 | 42/111 [00:26<00:49, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9646, LAS: 0.9317, UEM: 0.6970, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4318, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.5093, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 41%|####1 | 46/111 [00:28<00:45, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9643, LAS: 0.9313, UEM: 0.6905, LEM: 0.4775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2069, partial_loss/deprel_loss: 0.3115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5109, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 44%|####4 | 49/111 [00:30<00:42, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9647, LAS: 0.9317, UEM: 0.6980, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0849, partial_loss/deprel_loss: 0.1925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3331, loss: 0.5082, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 47%|####6 | 52/111 [00:33<00:41, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9636, LAS: 0.9306, UEM: 0.6847, LEM: 0.4741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7901, partial_loss/deprel_loss: 0.4558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.5165, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 50%|##### | 56/111 [00:35<00:37, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9637, LAS: 0.9306, UEM: 
0.6816, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4952, loss: 0.5146, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 53%|#####3 | 59/111 [00:37<00:35, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9631, LAS: 0.9296, UEM: 0.6729, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3769, partial_loss/deprel_loss: 0.4646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.5212, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||: 56%|#####5 | 62/111 [00:39<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9633, LAS: 0.9297, UEM: 0.6692, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2217, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.5206, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||: 59%|#####9 | 66/111 [00:41<00:28, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9627, LAS: 0.9290, UEM: 0.6628, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6047, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6637, loss: 0.5258, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 63%|######3 | 70/111 [00:45<00:28, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9625, LAS: 0.9287, UEM: 0.6564, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5930, loss: 0.5275, batch_reg_loss: 
0.1620, reg_loss: 0.1621 ||: 66%|######5 | 73/111 [00:47<00:26, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9627, LAS: 0.9290, UEM: 0.6556, LEM: 0.4382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3633, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5013, loss: 0.5263, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 69%|######9 | 77/111 [00:49<00:22, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9630, LAS: 0.9293, UEM: 0.6552, LEM: 0.4360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2212, partial_loss/deprel_loss: 0.2669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5241, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 73%|#######2 | 81/111 [00:52<00:20, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9634, LAS: 0.9297, UEM: 0.6572, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1872, partial_loss/deprel_loss: 0.2738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5218, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 77%|#######6 | 85/111 [00:54<00:17, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9632, LAS: 0.9295, UEM: 0.6530, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2652, partial_loss/deprel_loss: 0.3209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4717, loss: 0.5238, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 80%|######## | 89/111 [00:57<00:14, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9628, LAS: 0.9290, UEM: 0.6508, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5269, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 84%|########3 | 93/111 [01:00<00:12, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9627, LAS: 0.9289, UEM: 0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.2665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.5265, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 87%|########7 | 97/111 [01:03<00:10, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9625, LAS: 0.9288, UEM: 0.6574, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4383, partial_loss/deprel_loss: 0.4457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6062, loss: 0.5284, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 90%|######### | 100/111 [01:05<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9621, LAS: 0.9284, UEM: 0.6529, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7947, loss: 0.5315, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 93%|#########2| 103/111 [01:07<00:05, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9622, LAS: 0.9286, UEM: 0.6580, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5416, partial_loss/deprel_loss: 0.4245, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.5292, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||: 95%|#########5| 106/111 [01:10<00:03, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9617, LAS: 0.9280, UEM: 0.6534, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0117, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7853, loss: 0.5327, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||: 99%|#########9| 110/111 [01:13<00:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9615, LAS: 0.9277, UEM: 0.6512, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6477, partial_loss/deprel_loss: 0.5848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7593, loss: 0.5348, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.585 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.648 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - reg_loss | 0.162 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UEM | 0.651 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - loss | 0.535 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEM | 0.432 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EM | 0.901 | N/A\n", + "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:32:24,083 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:32:29,151 - INFO - combo.training.trainer - Epoch duration: 0:01:22.169650\n", + "2023-04-07 01:32:29,152 - INFO - combo.training.trainer - Estimated training time remaining: 6:24:11\n", + "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Epoch 119/399\n", + "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:32:29,162 - INFO - allennlp.training.trainer - Training\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9560, LAS: 0.9230, UEM: 0.6512, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.4480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6467, loss: 0.5886, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 5%|4 | 5/111 [00:02<00:52, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9547, LAS: 0.9204, UEM: 0.5686, LEM: 0.3328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9893, partial_loss/deprel_loss: 0.5484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.5991, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 9%|9 | 10/111 [00:04<00:49, 2.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9562, LAS: 0.9221, UEM: 0.5881, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6123, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6141, loss: 0.5779, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 14%|#3 | 15/111 
[00:07<00:46, 2.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9558, LAS: 0.9221, UEM: 0.5655, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3024, partial_loss/deprel_loss: 0.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5763, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 17%|#7 | 19/111 [00:09<00:49, 1.88it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9567, LAS: 0.9229, UEM: 0.5671, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4757, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5670, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 21%|## | 23/111 [00:12<00:49, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9571, LAS: 0.9234, UEM: 0.6038, LEM: 0.3925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2781, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5615, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 23%|##3 | 26/111 [00:14<00:53, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9594, LAS: 0.9259, UEM: 0.6656, LEM: 0.4674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0312, partial_loss/deprel_loss: 0.1093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.5430, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 26%|##6 | 29/111 [00:17<00:56, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9607, LAS: 0.9274, UEM: 0.6750, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4048, loss: 0.5329, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 29%|##8 | 32/111 [00:19<00:57, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9607, LAS: 0.9274, UEM: 0.6677, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4143, loss: 0.5330, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 32%|###1 | 35/111 [00:21<00:54, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9616, LAS: 0.9282, UEM: 0.6710, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5294, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||: 34%|###4 | 38/111 [00:23<00:51, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9621, LAS: 0.9284, UEM: 0.6754, LEM: 0.4638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5263, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 37%|###6 | 41/111 [00:25<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9617, LAS: 0.9280, UEM: 0.6783, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0769, partial_loss/deprel_loss: 0.2259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3580, loss: 0.5280, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 40%|###9 | 44/111 [00:27<00:47, 1.40it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9621, LAS: 0.9284, UEM: 0.6747, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3800, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.5269, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 42%|####2 | 47/111 [00:29<00:44, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9608, LAS: 0.9271, UEM: 0.6570, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5127, partial_loss/deprel_loss: 0.4390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, loss: 0.5357, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 46%|####5 | 51/111 [00:32<00:41, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9614, LAS: 0.9277, UEM: 0.6581, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 50%|####9 | 55/111 [00:35<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9612, LAS: 0.9275, UEM: 0.6545, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 52%|#####2 | 58/111 [00:37<00:37, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9610, LAS: 0.9275, UEM: 0.6621, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5332, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 55%|#####4 | 61/111 [00:39<00:35, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9610, LAS: 0.9276, UEM: 0.6568, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3979, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5698, loss: 0.5333, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 58%|#####7 | 64/111 [00:42<00:34, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9608, LAS: 0.9273, UEM: 0.6518, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.3191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5350, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 60%|###### | 67/111 [00:44<00:31, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9607, LAS: 0.9271, UEM: 0.6513, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.3120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5358, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||: 63%|######3 | 70/111 [00:46<00:29, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9607, LAS: 0.9270, UEM: 0.6530, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4823, loss: 0.5351, batch_reg_loss: 
0.1618, reg_loss: 0.1619 ||: 67%|######6 | 74/111 [00:49<00:26, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9603, LAS: 0.9266, UEM: 0.6537, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.5373, batch_reg_loss: 0.1618, reg_loss: 0.1618 ||: 70%|####### | 78/111 [00:51<00:23, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9600, LAS: 0.9264, UEM: 0.6507, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7320, partial_loss/deprel_loss: 0.4751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6882, loss: 0.5391, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 73%|#######2 | 81/111 [00:54<00:22, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9596, LAS: 0.9260, UEM: 0.6459, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 0.5417, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 77%|#######6 | 85/111 [00:56<00:18, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9593, LAS: 0.9257, UEM: 0.6400, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5148, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6482, loss: 0.5443, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 79%|#######9 | 88/111 [00:59<00:16, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9596, LAS: 0.9261, UEM: 
0.6410, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4468, loss: 0.5411, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 82%|########1 | 91/111 [01:01<00:14, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9600, LAS: 0.9265, UEM: 0.6463, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.5384, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 85%|########4 | 94/111 [01:03<00:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9601, LAS: 0.9266, UEM: 0.6469, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3405, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.5386, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 87%|########7 | 97/111 [01:05<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9602, LAS: 0.9266, UEM: 0.6479, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5201, partial_loss/deprel_loss: 0.4496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5378, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 90%|######### | 100/111 [01:07<00:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9606, LAS: 0.9270, UEM: 0.6509, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5157, partial_loss/deprel_loss: 0.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.5354, 
batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 94%|#########3| 104/111 [01:09<00:04, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9607, LAS: 0.9271, UEM: 0.6519, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2124, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4618, loss: 0.5335, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 97%|#########7| 108/111 [01:12<00:02, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:33:46,617 - INFO - 
combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.272 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.251 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - reg_loss | 0.162 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UEM | 0.649 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LAS | 0.927 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - loss | 0.533 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEM | 0.435 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UAS | 0.961 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EM | 0.936 | N/A\n", + "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:33:46,623 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Epoch duration: 0:01:25.103205\n", + "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:56\n", + "2023-04-07 01:33:54,257 - INFO - allennlp.training.trainer - Epoch 120/399\n", + "2023-04-07 01:33:54,258 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:33:54,259 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:33:54,269 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9501, LAS: 0.9170, UEM: 0.5021, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8535, partial_loss/deprel_loss: 0.5228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7506, loss: 0.5918, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||: 4%|3 | 4/111 [00:02<01:01, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9531, LAS: 0.9200, UEM: 0.4871, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.5803, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||: 7%|7 | 8/111 [00:05<01:02, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9541, LAS: 0.9206, UEM: 0.5231, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6122, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.5758, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||: 10%|9 | 11/111 
[00:07<01:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9580, LAS: 0.9244, UEM: 0.5806, LEM: 0.3570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3549, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5143, loss: 0.5547, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||: 13%|#2 | 14/111 [00:09<01:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9595, LAS: 0.9262, UEM: 0.5897, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5475, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6344, loss: 0.5433, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 16%|#6 | 18/111 [00:12<01:01, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9603, LAS: 0.9269, UEM: 0.5869, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5389, loss: 0.5377, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 20%|#9 | 22/111 [00:14<00:58, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9625, LAS: 0.9299, UEM: 0.6652, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0359, partial_loss/deprel_loss: 0.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5194, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 23%|##2 | 25/111 [00:17<01:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9603, LAS: 0.9278, UEM: 0.6394, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2706, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4722, loss: 0.5364, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 26%|##6 | 29/111 [00:19<00:55, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9608, LAS: 0.9282, UEM: 0.6520, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2792, partial_loss/deprel_loss: 0.3689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5125, loss: 0.5330, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 29%|##8 | 32/111 [00:21<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9617, LAS: 0.9292, UEM: 0.6638, LEM: 0.4631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6114, loss: 0.5262, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 32%|###2 | 36/111 [00:24<00:51, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9611, LAS: 0.9286, UEM: 0.6649, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4831, partial_loss/deprel_loss: 0.4557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.5295, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 36%|###6 | 40/111 [00:27<00:48, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9621, LAS: 0.9297, UEM: 0.6798, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.5221, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||: 39%|###8 | 43/111 [00:29<00:46, 1.46it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9620, LAS: 0.9296, UEM: 0.6714, LEM: 0.4641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.5224, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 42%|####2 | 47/111 [00:31<00:42, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9619, LAS: 0.9292, UEM: 0.6658, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5552, partial_loss/deprel_loss: 0.4651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6446, loss: 0.5248, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 46%|####5 | 51/111 [00:34<00:40, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9615, LAS: 0.9288, UEM: 0.6645, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7061, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.5273, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 49%|####8 | 54/111 [00:36<00:38, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9615, LAS: 0.9286, UEM: 0.6585, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3896, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5292, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 52%|#####2 | 58/111 [00:38<00:34, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9623, LAS: 0.9292, UEM: 0.6673, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3596, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6037, loss: 0.5255, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 56%|#####5 | 62/111 [00:41<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9628, LAS: 0.9299, UEM: 0.6752, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5204, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 59%|#####8 | 65/111 [00:43<00:31, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9619, LAS: 0.9288, UEM: 0.6688, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.3716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.5295, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 61%|######1 | 68/111 [00:46<00:30, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9615, LAS: 0.9283, UEM: 0.6717, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3385, loss: 0.5329, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 64%|######3 | 71/111 [00:48<00:29, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9619, LAS: 0.9286, UEM: 0.6709, LEM: 0.4567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5311, batch_reg_loss: 
0.1615, reg_loss: 0.1616 ||: 68%|######7 | 75/111 [00:51<00:25, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9617, LAS: 0.9284, UEM: 0.6664, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4704, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5322, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 71%|#######1 | 79/111 [00:53<00:22, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9618, LAS: 0.9285, UEM: 0.6676, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2552, partial_loss/deprel_loss: 0.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.5314, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||: 74%|#######3 | 82/111 [00:56<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9618, LAS: 0.9283, UEM: 0.6666, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5323, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||: 77%|#######7 | 86/111 [00:58<00:17, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9617, LAS: 0.9283, UEM: 0.6735, LEM: 0.4597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0861, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8239, loss: 0.5321, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||: 80%|######## | 89/111 [01:01<00:15, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9616, LAS: 0.9283, UEM: 
0.6689, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.5322, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 84%|########3 | 93/111 [01:03<00:12, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9617, LAS: 0.9281, UEM: 0.6673, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4933, loss: 0.5328, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 86%|########6 | 96/111 [01:05<00:10, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9281, UEM: 0.6644, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3597, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.5319, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 90%|######### | 100/111 [01:08<00:07, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9613, LAS: 0.9277, UEM: 0.6560, LEM: 0.4402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5347, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 95%|#########4| 105/111 [01:10<00:03, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9615, LAS: 0.9278, UEM: 0.6528, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1941, partial_loss/deprel_loss: 0.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5337, 
batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 99%|#########9| 110/111 [01:12<00:00, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9616, LAS: 0.9279, UEM: 0.6534, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.5333, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:35:10,476 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9340, LAS: 0.8843, UEM: 0.7299, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1551, partial_loss/deprel_loss: 22.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1009, loss: 30.5976, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 15%|#5 | 2/13 [00:02<00:12, 1.10s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9563, LAS: 0.9123, UEM: 0.8067, LEM: 0.5765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 25.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 20.3500, loss: 21.9278, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 38%|###8 | 5/13 [00:05<00:08, 1.06s/it]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9492, LAS: 0.9002, UEM: 0.7154, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 41.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2106, loss: 24.2740, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:08<00:05, 1.04s/it]\n", + "UPOS_ACC: 
0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9480, LAS: 0.8980, UEM: 0.6665, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 32.8922, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4571, loss: 23.9450, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9475, LAS: 0.8973, UEM: 0.6503, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 23.6254, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9900, loss: 24.5413, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - patience | 4.000 | N/A\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.351 | 23.625\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - 
partial_loss/head_loss | 0.231 | 0.448\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - reg_loss | 0.162 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UEM | 0.653 | 0.650\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | 0.897\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - loss | 0.533 | 24.541\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEM | 0.435 | 0.389\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | 0.947\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EM | 0.935 | 0.914\n", + "2023-04-07 01:35:23,096 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:35:23,101 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:35:28,020 - INFO - combo.training.trainer - Epoch duration: 0:01:33.762829\n", + "2023-04-07 01:35:28,021 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:01\n", + "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Epoch 121/399\n", + "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:35:28,028 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9625, LAS: 0.9278, UEM: 0.6975, LEM: 0.4612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6717, loss: 0.5151, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||: 3%|2 | 3/111 [00:02<01:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9672, LAS: 0.9355, UEM: 0.7027, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2837, partial_loss/deprel_loss: 0.3431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.4797, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||: 6%|6 | 7/111 [00:04<01:10, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9678, LAS: 0.9357, UEM: 0.7548, LEM: 0.5496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6550, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7039, loss: 0.4759, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||: 9%|9 | 10/111 
[00:06<01:08, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9662, LAS: 0.9341, UEM: 0.7161, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4548, loss: 0.4895, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||: 12%|#1 | 13/111 [00:08<01:07, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9625, LAS: 0.9294, UEM: 0.7186, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0669, partial_loss/deprel_loss: 0.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5213, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||: 14%|#4 | 16/111 [00:11<01:07, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9621, LAS: 0.9291, UEM: 0.6897, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5918, loss: 0.5272, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||: 18%|#8 | 20/111 [00:13<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9629, LAS: 0.9297, UEM: 0.7008, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6002, loss: 0.5215, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||: 21%|## | 23/111 [00:15<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9615, LAS: 0.9286, UEM: 0.6829, LEM: 0.4761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7517, loss: 0.5324, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 23%|##3 | 26/111 [00:17<00:59, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9601, LAS: 0.9271, UEM: 0.6503, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5419, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 27%|##7 | 30/111 [00:20<00:56, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9600, LAS: 0.9269, UEM: 0.6390, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4914, loss: 0.5444, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 30%|##9 | 33/111 [00:22<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9602, LAS: 0.9271, UEM: 0.6246, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5958, partial_loss/deprel_loss: 0.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.5440, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 33%|###3 | 37/111 [00:25<00:49, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9592, LAS: 0.9259, UEM: 0.6117, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9584, partial_loss/deprel_loss: 0.5039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7561, loss: 0.5516, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 36%|###6 | 40/111 [00:27<00:48, 1.47it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9582, LAS: 0.9248, UEM: 0.5995, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8587, partial_loss/deprel_loss: 0.6059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8177, loss: 0.5590, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 39%|###8 | 43/111 [00:29<00:46, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9257, UEM: 0.6153, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1867, partial_loss/deprel_loss: 0.2768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4200, loss: 0.5514, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 41%|####1 | 46/111 [00:31<00:46, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9586, LAS: 0.9252, UEM: 0.6056, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8144, partial_loss/deprel_loss: 0.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7414, loss: 0.5554, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 45%|####5 | 50/111 [00:34<00:42, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9596, LAS: 0.9260, UEM: 0.6167, LEM: 0.3957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4083, loss: 0.5495, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||: 48%|####7 | 53/111 [00:36<00:41, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9602, LAS: 0.9265, UEM: 0.6188, LEM: 0.3926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.3921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.5468, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 51%|#####1 | 57/111 [00:39<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9598, LAS: 0.9262, UEM: 0.6186, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1625, partial_loss/deprel_loss: 0.2233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3724, loss: 0.5476, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 55%|#####4 | 61/111 [00:41<00:33, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9602, LAS: 0.9266, UEM: 0.6270, LEM: 0.4035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.5433, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 59%|#####8 | 65/111 [00:43<00:29, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9609, LAS: 0.9273, UEM: 0.6400, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.2523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3933, loss: 0.5379, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 62%|######2 | 69/111 [00:46<00:25, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9614, LAS: 0.9277, UEM: 0.6463, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2193, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4581, loss: 0.5341, batch_reg_loss: 
0.1612, reg_loss: 0.1613 ||: 66%|######5 | 73/111 [00:48<00:22, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9614, LAS: 0.9276, UEM: 0.6457, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5339, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 70%|####### | 78/111 [00:50<00:18, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9616, LAS: 0.9279, UEM: 0.6571, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0336, partial_loss/deprel_loss: 0.0988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2469, loss: 0.5322, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 74%|#######3 | 82/111 [00:53<00:17, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9616, LAS: 0.9279, UEM: 0.6532, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5493, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6106, loss: 0.5317, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 77%|#######7 | 86/111 [00:56<00:16, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9621, LAS: 0.9284, UEM: 0.6628, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1212, partial_loss/deprel_loss: 0.2469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5276, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||: 81%|########1 | 90/111 [00:58<00:13, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9621, LAS: 0.9284, UEM: 
0.6589, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2574, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5275, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||: 85%|########4 | 94/111 [01:01<00:10, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9617, LAS: 0.9281, UEM: 0.6526, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.5303, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||: 88%|########8 | 98/111 [01:03<00:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9618, LAS: 0.9281, UEM: 0.6492, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2187, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4653, loss: 0.5298, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||: 92%|#########1| 102/111 [01:06<00:05, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9621, LAS: 0.9285, UEM: 0.6590, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1560, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3856, loss: 0.5267, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||: 95%|#########5| 106/111 [01:09<00:03, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9620, LAS: 0.9284, UEM: 0.6538, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2230, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.5279, 
batch_reg_loss: 0.1611, reg_loss: 0.1612 ||: 99%|#########9| 110/111 [01:11<00:00, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9620, LAS: 0.9284, UEM: 0.6522, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3857, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5279, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.360 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.386 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - reg_loss | 0.161 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UEM | 0.652 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LAS | 0.928 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - 
combo.training.tensorboard_writer - loss | 0.528 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEM | 0.433 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EM | 0.932 | N/A\n", + "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:36:43,257 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Epoch duration: 0:01:21.032962\n", + "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Estimated training time remaining: 6:20:36\n", + "2023-04-07 01:36:49,054 - INFO - allennlp.training.trainer - Epoch 122/399\n", + "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:36:49,065 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9650, LAS: 0.9338, UEM: 0.6522, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.2491, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.3946, loss: 0.4751, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||: 3%|2 | 3/111 [00:02<01:13, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9639, LAS: 0.9312, UEM: 0.6423, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.2690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4096, loss: 0.4931, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||: 5%|5 | 6/111 [00:04<01:15, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9595, LAS: 0.9277, UEM: 0.6090, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6391, loss: 0.5225, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||: 8%|8 | 9/111 [00:06<01:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9620, LAS: 0.9302, UEM: 0.6435, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.4132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5120, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||: 11%|# | 12/111 [00:08<01:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9622, LAS: 0.9303, UEM: 0.6295, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5368, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5119, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||: 14%|#4 | 16/111 [00:11<01:06, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9621, LAS: 
0.9310, UEM: 0.6313, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.2616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4044, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||: 18%|#8 | 20/111 [00:13<01:02, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9600, LAS: 0.9284, UEM: 0.6104, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5285, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||: 22%|##1 | 24/111 [00:16<00:57, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9605, LAS: 0.9289, UEM: 0.6192, LEM: 0.3952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4484, loss: 0.5258, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||: 24%|##4 | 27/111 [00:18<00:57, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9619, LAS: 0.9303, UEM: 0.6544, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5141, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||: 27%|##7 | 30/111 [00:21<00:58, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9629, LAS: 0.9312, UEM: 0.6662, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3693, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.5084, batch_reg_loss: 
0.1610, reg_loss: 0.1610 ||: 30%|##9 | 33/111 [00:23<00:57, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9629, LAS: 0.9305, UEM: 0.6631, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5118, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 32%|###2 | 36/111 [00:25<00:53, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9633, LAS: 0.9313, UEM: 0.6878, LEM: 0.4793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.5070, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 35%|###5 | 39/111 [00:27<00:54, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9308, UEM: 0.6790, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4333, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5128, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 38%|###7 | 42/111 [00:29<00:50, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9631, LAS: 0.9308, UEM: 0.6764, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5079, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.5122, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 41%|#### | 45/111 [00:31<00:47, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9633, LAS: 0.9310, UEM: 0.6768, LEM: 0.4627, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 45%|####5 | 50/111 [00:34<00:38, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9636, LAS: 0.9313, UEM: 0.6799, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1367, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3562, loss: 0.5074, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||: 49%|####8 | 54/111 [00:36<00:36, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9640, LAS: 0.9317, UEM: 0.6884, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4297, partial_loss/deprel_loss: 0.4490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.5048, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 52%|#####2 | 58/111 [00:39<00:34, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9637, LAS: 0.9314, UEM: 0.6777, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5461, loss: 0.5078, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 56%|#####5 | 62/111 [00:42<00:31, 1.55it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9630, LAS: 0.9305, UEM: 0.6654, LEM: 0.4556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6359, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6578, loss: 0.5146, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 59%|#####9 | 66/111 [00:44<00:28, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9625, LAS: 0.9298, UEM: 0.6570, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5197, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 63%|######3 | 70/111 [00:46<00:24, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9622, LAS: 0.9297, UEM: 0.6520, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.5635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.5221, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 68%|######7 | 75/111 [00:48<00:20, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9626, LAS: 0.9299, UEM: 0.6525, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.5188, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 72%|#######2 | 80/111 [00:51<00:16, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9625, LAS: 0.9298, UEM: 0.6539, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2805, partial_loss/deprel_loss: 0.3755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.5198, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 76%|#######5 | 84/111 [00:54<00:16, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.8951, UAS: 0.9627, LAS: 0.9299, UEM: 0.6608, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7551, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7516, loss: 0.5183, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 79%|#######9 | 88/111 [00:56<00:14, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9627, LAS: 0.9299, UEM: 0.6589, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6415, loss: 0.5184, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||: 83%|########2 | 92/111 [00:59<00:12, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9560, UAS: 0.9624, LAS: 0.9296, UEM: 0.6645, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0866, partial_loss/deprel_loss: 0.1841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3254, loss: 0.5205, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||: 86%|########6 | 96/111 [01:03<00:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9627, LAS: 0.9298, UEM: 0.6662, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1921, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5180, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||: 90%|######### | 100/111 [01:05<00:07, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9297, UEM: 0.6625, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3515, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5188, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||: 94%|#########3| 104/111 [01:08<00:04, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9625, LAS: 0.9296, UEM: 0.6571, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4424, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.5207, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||: 97%|#########7| 108/111 [01:10<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9621, LAS: 0.9291, UEM: 0.6547, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9304, partial_loss/deprel_loss: 0.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8291, loss: 0.5234, batch_reg_loss: 0.1608, reg_loss: 0.1609 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:38:04,746 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.603 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.930 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - reg_loss | 0.161 | N/A\n", + "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UEM | 0.655 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - loss | 0.523 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEM | 0.437 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EM | 0.886 | N/A\n", + "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:38:04,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Epoch duration: 0:01:20.506074\n", + "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Estimated training time remaining: 6:19:10\n", + "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Epoch 123/399\n", + "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:38:09,562 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:38:09,571 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9549, LAS: 0.9194, UEM: 0.5681, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5232, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6516, loss: 0.6007, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 3%|2 | 3/111 [00:02<01:23, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9627, LAS: 0.9298, UEM: 0.6188, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2662, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.5094, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 6%|6 | 7/111 [00:04<01:16, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9634, LAS: 0.9311, UEM: 0.6393, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1946, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4280, loss: 0.5030, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 9%|9 | 10/111 
[00:07<01:13, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9645, LAS: 0.9316, UEM: 0.6506, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2571, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5021, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 13%|#2 | 14/111 [00:09<01:08, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9662, LAS: 0.9337, UEM: 0.6572, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2175, partial_loss/deprel_loss: 0.2773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4261, loss: 0.4903, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 16%|#6 | 18/111 [00:12<01:02, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9671, LAS: 0.9346, UEM: 0.6837, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0700, partial_loss/deprel_loss: 0.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3216, loss: 0.4854, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||: 19%|#8 | 21/111 [00:14<01:02, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9682, LAS: 0.9361, UEM: 0.7249, LEM: 0.5181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.4779, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||: 22%|##1 | 24/111 [00:16<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9669, LAS: 0.9349, UEM: 0.7034, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.3622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.4832, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||: 25%|##5 | 28/111 [00:19<00:56, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9646, LAS: 0.9328, UEM: 0.6862, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4493, loss: 0.4968, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||: 29%|##8 | 32/111 [00:21<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9639, LAS: 0.9318, UEM: 0.6867, LEM: 0.4800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.5024, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||: 32%|###2 | 36/111 [00:24<00:49, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9632, LAS: 0.9314, UEM: 0.6798, LEM: 0.4733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3144, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5084, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||: 36%|###6 | 40/111 [00:26<00:45, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9624, LAS: 0.9305, UEM: 0.6818, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5125, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||: 40%|###9 | 44/111 [00:29<00:45, 1.46it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9616, LAS: 0.9297, UEM: 0.6681, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4001, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.5174, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||: 42%|####2 | 47/111 [00:31<00:43, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9607, LAS: 0.9289, UEM: 0.6482, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.4718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.5269, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||: 47%|####6 | 52/111 [00:34<00:36, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9278, UEM: 0.6335, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.5339, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||: 51%|#####1 | 57/111 [00:36<00:31, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9248, UAS: 0.9601, LAS: 0.9277, UEM: 0.6278, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.3265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5320, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||: 56%|#####5 | 62/111 [00:38<00:26, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9605, LAS: 0.9281, UEM: 0.6417, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1840, partial_loss/deprel_loss: 0.2735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4163, loss: 0.5269, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 59%|#####9 | 66/111 [00:41<00:26, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9610, LAS: 0.9285, UEM: 0.6508, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2534, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.5238, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 63%|######3 | 70/111 [00:44<00:26, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9610, LAS: 0.9285, UEM: 0.6460, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6746, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6763, loss: 0.5240, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 67%|######6 | 74/111 [00:47<00:24, 1.50it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9608, LAS: 0.9282, UEM: 0.6378, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4768, loss: 0.5275, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 70%|####### | 78/111 [00:49<00:21, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9609, LAS: 0.9282, UEM: 0.6335, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3490, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5159, loss: 0.5275, batch_reg_loss: 
0.1606, reg_loss: 0.1607 ||: 74%|#######3 | 82/111 [00:52<00:18, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9609, LAS: 0.9282, UEM: 0.6348, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5278, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 77%|#######7 | 86/111 [00:54<00:15, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9612, LAS: 0.9283, UEM: 0.6366, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.2907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5276, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 81%|########1 | 90/111 [01:00<00:17, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9614, LAS: 0.9285, UEM: 0.6366, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1536, partial_loss/deprel_loss: 0.2921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4250, loss: 0.5268, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 84%|########3 | 93/111 [01:02<00:14, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9613, LAS: 0.9283, UEM: 0.6353, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6619, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 87%|########7 | 97/111 [01:05<00:10, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9613, LAS: 0.9283, 
UEM: 0.6374, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5876, partial_loss/deprel_loss: 0.5230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 90%|######### | 100/111 [01:07<00:08, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9616, LAS: 0.9286, UEM: 0.6455, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0841, partial_loss/deprel_loss: 0.1611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5250, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||: 93%|#########2| 103/111 [01:09<00:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9621, LAS: 0.9290, UEM: 0.6533, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0820, partial_loss/deprel_loss: 0.2228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5223, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||: 95%|#########5| 106/111 [01:11<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9618, LAS: 0.9288, UEM: 0.6516, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 0.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5359, loss: 0.5229, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||: 99%|#########9| 110/111 [01:14<00:00, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9619, LAS: 0.9288, UEM: 0.6520, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 
0.5222, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||: 100%|##########| 111/111 [01:14<00:00, 1.48it/s]\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.296 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.243 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - reg_loss | 0.161 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UEM | 0.652 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - loss | 0.522 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEM | 0.439 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 
| N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EM | 0.935 | N/A\n", + "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:39:27,740 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Epoch duration: 0:01:23.310651\n", + "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Estimated training time remaining: 6:17:51\n", + "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Epoch 124/399\n", + "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:39:32,873 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:39:32,880 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9491, LAS: 0.9161, UEM: 0.6139, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.5831, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 3%|2 | 3/111 [00:02<01:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9620, LAS: 0.9297, UEM: 0.7283, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4854, 
loss: 0.4947, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 6%|6 | 7/111 [00:04<01:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9588, LAS: 0.9263, UEM: 0.6802, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2412, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5317, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 9%|9 | 10/111 [00:06<01:12, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9610, LAS: 0.9292, UEM: 0.6884, LEM: 0.4948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4406, loss: 0.5143, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 12%|#1 | 13/111 [00:09<01:10, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9613, LAS: 0.9293, UEM: 0.6973, LEM: 0.5000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.5118, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 14%|#4 | 16/111 [00:11<01:11, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9637, LAS: 0.9318, UEM: 0.7138, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.2853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.4976, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 17%|#7 | 19/111 [00:14<01:11, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9640, LAS: 0.9321, UEM: 
0.6946, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.4999, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 21%|## | 23/111 [00:16<01:04, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9647, LAS: 0.9322, UEM: 0.6975, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2924, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.4974, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9642, LAS: 0.9318, UEM: 0.6884, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.5012, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 27%|##7 | 30/111 [00:21<00:55, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9608, LAS: 0.9285, UEM: 0.6741, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3414, partial_loss/deprel_loss: 0.6991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9880, loss: 0.5256, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 32%|###1 | 35/111 [00:23<00:47, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9610, LAS: 0.9290, UEM: 0.6652, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.2850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.5230, batch_reg_loss: 0.1604, 
reg_loss: 0.1605 ||: 36%|###6 | 40/111 [00:25<00:40, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9595, LAS: 0.9278, UEM: 0.6427, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7856, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6576, loss: 0.5322, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 41%|#### | 45/111 [00:27<00:35, 1.88it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9603, LAS: 0.9287, UEM: 0.6684, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1457, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.5273, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 44%|####4 | 49/111 [00:30<00:34, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9606, LAS: 0.9289, UEM: 0.6664, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.5259, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 48%|####7 | 53/111 [00:33<00:34, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9604, LAS: 0.9284, UEM: 0.6559, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4398, partial_loss/deprel_loss: 0.4302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.5301, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||: 51%|#####1 | 57/111 [00:36<00:35, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9608, LAS: 0.9289, UEM: 0.6569, LEM: 0.4490, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2930, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||: 55%|#####4 | 61/111 [00:39<00:33, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9612, LAS: 0.9292, UEM: 0.6546, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5240, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||: 59%|#####8 | 65/111 [00:42<00:31, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9609, LAS: 0.9288, UEM: 0.6453, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4810, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||: 62%|######2 | 69/111 [00:44<00:27, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9615, LAS: 0.9291, UEM: 0.6501, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3155, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.5236, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||: 66%|######5 | 73/111 [00:47<00:25, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9618, LAS: 0.9295, UEM: 0.6574, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1190, partial_loss/deprel_loss: 0.2381, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.3747, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 69%|######9 | 77/111 [00:50<00:23, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9619, LAS: 0.9296, UEM: 0.6547, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5202, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 72%|#######2 | 80/111 [00:52<00:21, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9620, LAS: 0.9295, UEM: 0.6601, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5197, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 75%|#######4 | 83/111 [00:54<00:19, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9623, LAS: 0.9298, UEM: 0.6635, LEM: 0.4503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.4249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.5184, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 78%|#######8 | 87/111 [00:57<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9623, LAS: 0.9299, UEM: 0.6621, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4647, loss: 0.5186, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 82%|########1 | 91/111 [00:59<00:13, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9298, UAS: 0.9624, LAS: 0.9299, UEM: 0.6604, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3465, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5171, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 85%|########4 | 94/111 [01:01<00:11, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9622, LAS: 0.9298, UEM: 0.6586, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1817, partial_loss/deprel_loss: 0.2733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.5183, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 88%|########8 | 98/111 [01:04<00:08, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9618, LAS: 0.9294, UEM: 0.6544, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 92%|#########1| 102/111 [01:07<00:05, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9622, LAS: 0.9298, UEM: 0.6596, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1177, partial_loss/deprel_loss: 0.2160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3566, loss: 0.5175, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 95%|#########5| 106/111 [01:09<00:03, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9620, LAS: 0.9296, UEM: 0.6558, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3323, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.4664, loss: 0.5189, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||: 99%|#########9| 110/111 [01:12<00:00, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9619, LAS: 0.9295, UEM: 0.6539, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6005, loss: 0.5196, batch_reg_loss: 0.1602, reg_loss: 0.1604 ||: 100%|##########| 111/111 [01:13<00:00, 1.52it/s]\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.419 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.526 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | N/A\n", + "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UEM | 0.654 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - 
LAS | 0.929 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - loss | 0.520 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEM | 0.437 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EM | 0.918 | N/A\n", + "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:40:49,222 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:40:54,297 - INFO - combo.training.trainer - Epoch duration: 0:01:21.425042\n", + "2023-04-07 01:40:54,298 - INFO - combo.training.trainer - Estimated training time remaining: 6:16:27\n", + "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Epoch 125/399\n", + "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:40:54,299 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:40:54,308 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9613, LAS: 0.9313, UEM: 0.6735, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5213, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5903, loss: 0.4758, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 3%|2 | 3/111 [00:02<01:25, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9645, LAS: 0.9329, UEM: 0.6774, LEM: 0.4719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3121, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5055, loss: 0.4733, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 5%|5 | 6/111 [00:04<01:24, 1.24it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9655, LAS: 0.9342, UEM: 0.6826, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.2511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3966, loss: 0.4649, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 8%|8 | 9/111 
[00:07<01:23, 1.23it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9650, LAS: 0.9340, UEM: 0.6952, LEM: 0.5047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5937, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.4787, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 11%|# | 12/111 [00:09<01:19, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9649, LAS: 0.9337, UEM: 0.6848, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2166, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4670, loss: 0.4813, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 14%|#4 | 16/111 [00:11<01:09, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9660, LAS: 0.9351, UEM: 0.7062, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3484, loss: 0.4730, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 19%|#8 | 21/111 [00:14<00:59, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9748, UAS: 0.9654, LAS: 0.9346, UEM: 0.7213, LEM: 0.5392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0280, partial_loss/deprel_loss: 0.0973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2436, loss: 0.4750, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 23%|##3 | 26/111 [00:17<00:52, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9653, LAS: 0.9340, UEM: 0.7162, LEM: 0.5280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1675, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3882, loss: 0.4790, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 28%|##7 | 31/111 [00:19<00:45, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9649, LAS: 0.9334, UEM: 0.7044, LEM: 0.5135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4407, loss: 0.4833, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||: 32%|###1 | 35/111 [00:22<00:47, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9654, LAS: 0.9339, UEM: 0.7023, LEM: 0.5059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3088, partial_loss/deprel_loss: 0.3605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.4810, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 35%|###5 | 39/111 [00:25<00:47, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9658, LAS: 0.9344, UEM: 0.7101, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0582, partial_loss/deprel_loss: 0.1520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2933, loss: 0.4785, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 39%|###8 | 43/111 [00:28<00:47, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9658, LAS: 0.9344, UEM: 0.7116, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1175, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3602, loss: 0.4784, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 41%|####1 | 46/111 [00:30<00:45, 1.43it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9647, LAS: 0.9330, UEM: 0.7041, LEM: 0.5079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.4888, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 44%|####4 | 49/111 [00:32<00:43, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9644, LAS: 0.9326, UEM: 0.7008, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1494, partial_loss/deprel_loss: 0.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3868, loss: 0.4925, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 47%|####6 | 52/111 [00:34<00:42, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9636, LAS: 0.9317, UEM: 0.6896, LEM: 0.4940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5430, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6372, loss: 0.4988, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 50%|####9 | 55/111 [00:37<00:40, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9632, LAS: 0.9313, UEM: 0.6814, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.5032, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 52%|#####2 | 58/111 [00:39<00:38, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9635, LAS: 0.9314, UEM: 0.6849, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0668, partial_loss/deprel_loss: 0.2211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3503, loss: 0.5031, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 55%|#####4 | 61/111 [00:41<00:36, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9631, LAS: 0.9309, UEM: 0.6769, LEM: 0.4773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2835, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 59%|#####8 | 65/111 [00:43<00:31, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9631, LAS: 0.9309, UEM: 0.6753, LEM: 0.4744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2259, partial_loss/deprel_loss: 0.3241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4645, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||: 62%|######2 | 69/111 [00:46<00:28, 1.48it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9633, LAS: 0.9310, UEM: 0.6719, LEM: 0.4695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.5057, batch_reg_loss: 0.1601, reg_loss: 0.1601 ||: 66%|######5 | 73/111 [00:48<00:24, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9633, LAS: 0.9308, UEM: 0.6678, LEM: 0.4625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5254, loss: 0.5079, batch_reg_loss: 
0.1600, reg_loss: 0.1601 ||: 69%|######9 | 77/111 [00:52<00:23, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9636, LAS: 0.9310, UEM: 0.6684, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3835, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5635, loss: 0.5069, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 72%|#######2 | 80/111 [00:54<00:21, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9632, LAS: 0.9306, UEM: 0.6658, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.2731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5088, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 75%|#######4 | 83/111 [00:56<00:19, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9625, LAS: 0.9298, UEM: 0.6636, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5155, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 77%|#######7 | 86/111 [00:58<00:17, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9619, LAS: 0.9293, UEM: 0.6578, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4905, partial_loss/deprel_loss: 0.4107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5867, loss: 0.5193, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 81%|########1 | 90/111 [01:01<00:14, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9620, LAS: 0.9293, UEM: 
0.6549, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3594, partial_loss/deprel_loss: 0.3532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 85%|########4 | 94/111 [01:03<00:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9620, LAS: 0.9293, UEM: 0.6545, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1414, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.5179, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 88%|########8 | 98/111 [01:06<00:09, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9618, LAS: 0.9291, UEM: 0.6529, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1656, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5198, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 91%|######### | 101/111 [01:08<00:06, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9616, LAS: 0.9288, UEM: 0.6486, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5981, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6592, loss: 0.5213, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 94%|#########3| 104/111 [01:10<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9617, LAS: 0.9288, UEM: 0.6468, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4200, partial_loss/deprel_loss: 0.3656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.5212, 
batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 96%|#########6| 107/111 [01:12<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9617, LAS: 0.9290, UEM: 0.6453, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.5202, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 99%|#########9| 110/111 [01:15<00:00, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9619, LAS: 0.9291, UEM: 0.6506, LEM: 0.4377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1172, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3705, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 100%|##########| 111/111 [01:16<00:00, 1.46it/s]\n", + "2023-04-07 01:42:13,636 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9530, LAS: 0.9045, UEM: 0.6088, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 16.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 13.5082, loss: 20.0456, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.05it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9492, LAS: 0.8996, UEM: 0.5886, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 25.1117, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1702, loss: 22.7926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.04it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9418, LAS: 0.8909, UEM: 0.5511, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3135, partial_loss/deprel_loss: 45.1808, partial_loss/cycle_loss: 0.0000, batch_loss: 36.4074, loss: 26.0686, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.08it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00, 1.20it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00, 1.21it/s]\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - 
combo.training.tensorboard_writer - patience | 3.000 | N/A\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.234 | 28.291\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.117 | 0.745\n", + "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | 0.000\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UEM | 0.651 | 0.654\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | 0.899\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - loss | 0.519 | 24.272\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEM | 0.438 | 0.400\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | 0.948\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EM | 0.947 | 0.888\n", + "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:42:24,432 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Epoch duration: 0:01:36.805760\n", + "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Estimated training time remaining: 6:15:37\n", + "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Epoch 126/399\n", + "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:42:31,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:42:31,115 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9523, LAS: 0.9153, UEM: 0.4448, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8348, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.6257, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||: 3%|2 | 3/111 [00:02<01:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9519, LAS: 0.9174, UEM: 0.4296, LEM: 0.1925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.6160, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||: 5%|5 | 6/111 [00:04<01:16, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9612, LAS: 0.9279, UEM: 0.6479, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1347, partial_loss/deprel_loss: 0.2565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5449, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||: 8%|8 | 9/111 
[00:06<01:17, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9587, LAS: 0.9255, UEM: 0.5725, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3705, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.5659, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||: 12%|#1 | 13/111 [00:09<01:11, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9550, LAS: 0.9218, UEM: 0.5284, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.5809, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||: 14%|#4 | 16/111 [00:11<01:08, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9576, LAS: 0.9248, UEM: 0.5812, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1394, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3411, loss: 0.5551, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||: 17%|#7 | 19/111 [00:13<01:07, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9591, LAS: 0.9260, UEM: 0.6086, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5340, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.5456, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||: 20%|#9 | 22/111 [00:16<01:04, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9265, UEM: 0.6058, LEM: 0.3898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.5419, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||: 23%|##2 | 25/111 [00:18<01:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9592, LAS: 0.9265, UEM: 0.5935, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5441, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||: 25%|##5 | 28/111 [00:20<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9607, LAS: 0.9278, UEM: 0.6173, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0671, partial_loss/deprel_loss: 0.2273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5343, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 29%|##8 | 32/111 [00:23<00:56, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9618, LAS: 0.9291, UEM: 0.6616, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0308, partial_loss/deprel_loss: 0.1074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2519, loss: 0.5274, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 32%|###1 | 35/111 [00:25<00:57, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9629, LAS: 0.9300, UEM: 0.6791, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1931, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4101, loss: 0.5188, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 34%|###4 | 38/111 [00:28<00:55, 1.32it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9631, LAS: 0.9299, UEM: 0.6741, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5209, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 37%|###6 | 41/111 [00:30<00:53, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9636, LAS: 0.9306, UEM: 0.6738, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3950, loss: 0.5159, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 40%|###9 | 44/111 [00:32<00:49, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9616, LAS: 0.9286, UEM: 0.6619, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1917, partial_loss/deprel_loss: 0.6342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.5302, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 42%|####2 | 47/111 [00:34<00:46, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9616, LAS: 0.9287, UEM: 0.6567, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3388, partial_loss/deprel_loss: 0.3337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.5289, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 45%|####5 | 50/111 [00:36<00:43, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9619, LAS: 0.9291, UEM: 0.6671, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5651, loss: 0.5256, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||: 48%|####7 | 53/111 [00:38<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9622, LAS: 0.9292, UEM: 0.6709, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3431, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.5249, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 51%|#####1 | 57/111 [00:41<00:37, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9625, LAS: 0.9295, UEM: 0.6701, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1366, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5231, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 55%|#####4 | 61/111 [00:43<00:32, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9627, LAS: 0.9295, UEM: 0.6651, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5233, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 59%|#####8 | 65/111 [00:46<00:30, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9625, LAS: 0.9294, UEM: 0.6603, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.5236, batch_reg_loss: 0.1598, 
reg_loss: 0.1599 ||: 62%|######2 | 69/111 [00:49<00:28, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9630, LAS: 0.9299, UEM: 0.6681, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2423, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5196, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 65%|######4 | 72/111 [00:51<00:27, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9628, LAS: 0.9297, UEM: 0.6628, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5273, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.5218, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 68%|######7 | 75/111 [00:54<00:27, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9633, LAS: 0.9302, UEM: 0.6708, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1428, partial_loss/deprel_loss: 0.2046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3520, loss: 0.5175, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 71%|#######1 | 79/111 [00:56<00:23, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9638, LAS: 0.9310, UEM: 0.6793, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0782, partial_loss/deprel_loss: 0.1631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3059, loss: 0.5128, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 75%|#######4 | 83/111 [00:59<00:20, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9306, UEM: 0.6747, 
LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.5153, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 78%|#######8 | 87/111 [01:02<00:16, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9633, LAS: 0.9305, UEM: 0.6681, LEM: 0.4555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.5166, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||: 82%|########1 | 91/111 [01:04<00:12, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9631, LAS: 0.9301, UEM: 0.6639, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1869, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.5193, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||: 86%|########5 | 95/111 [01:06<00:10, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9625, LAS: 0.9295, UEM: 0.6547, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6074, loss: 0.5237, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||: 90%|######### | 100/111 [01:09<00:06, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9627, LAS: 0.9297, UEM: 0.6560, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2675, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4424, loss: 0.5225, 
batch_reg_loss: 0.1597, reg_loss: 0.1599 ||: 94%|#########3| 104/111 [01:11<00:03, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9630, LAS: 0.9299, UEM: 0.6602, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5203, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||: 97%|#########7| 108/111 [01:13<00:01, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9630, LAS: 0.9301, UEM: 0.6596, LEM: 0.4437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.2761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4179, loss: 0.5199, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||: 100%|##########| 111/111 [01:15<00:00, 1.46it/s]\n", + "2023-04-07 01:43:50,185 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.276 | 
N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.186 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UEM | 0.660 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - LAS | 0.930 | N/A\n", + "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - loss | 0.520 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEM | 0.444 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EM | 0.943 | N/A\n", + "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:43:50,192 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:44:00,241 - INFO - combo.training.trainer - Epoch duration: 0:01:29.136743\n", + "2023-04-07 01:44:00,242 - INFO - combo.training.trainer - Estimated training time remaining: 6:14:29\n", + "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Epoch 127/399\n", + "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:44:00,243 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:44:00,251 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9666, LAS: 0.9335, UEM: 0.6822, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5529, loss: 0.4783, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 3%|2 | 3/111 [00:02<01:17, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9638, LAS: 0.9309, UEM: 0.6726, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5058, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 5%|5 | 6/111 [00:04<01:16, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9283, UEM: 0.5965, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2555, partial_loss/deprel_loss: 0.3948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5256, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 9%|9 | 10/111 
[00:06<01:10, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9636, LAS: 0.9300, UEM: 0.6324, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6324, loss: 0.5159, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 12%|#1 | 13/111 [00:09<01:11, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9637, LAS: 0.9308, UEM: 0.6668, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.4497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6541, loss: 0.5116, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 14%|#4 | 16/111 [00:11<01:10, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9639, LAS: 0.9320, UEM: 0.6639, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 0.2366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5048, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||: 18%|#8 | 20/111 [00:14<01:05, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9655, LAS: 0.9335, UEM: 0.6962, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.2687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4052, loss: 0.4916, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 21%|## | 23/111 [00:16<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9646, LAS: 0.9324, UEM: 0.6944, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5116, loss: 0.4969, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 23%|##3 | 26/111 [00:18<01:00, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9652, LAS: 0.9334, UEM: 0.7096, LEM: 0.5095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.3340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.4899, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 26%|##6 | 29/111 [00:20<00:58, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9649, LAS: 0.9331, UEM: 0.7063, LEM: 0.5084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5047, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5840, loss: 0.4897, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 29%|##8 | 32/111 [00:22<00:55, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9646, LAS: 0.9326, UEM: 0.7006, LEM: 0.5012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4657, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.4926, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 32%|###1 | 35/111 [00:25<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9638, LAS: 0.9318, UEM: 0.6895, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.4363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6079, loss: 0.4988, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||: 34%|###4 | 38/111 [00:27<00:52, 1.40it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9643, LAS: 0.9322, UEM: 0.6923, LEM: 0.4881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.4965, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||: 37%|###6 | 41/111 [00:29<00:49, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9650, LAS: 0.9329, UEM: 0.6934, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.4947, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||: 41%|#### | 45/111 [00:31<00:45, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9646, LAS: 0.9323, UEM: 0.6840, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3669, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5969, loss: 0.4992, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||: 43%|####3 | 48/111 [00:34<00:44, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9263, UAS: 0.9646, LAS: 0.9325, UEM: 0.6855, LEM: 0.4765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.4968, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||: 46%|####5 | 51/111 [00:36<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9644, LAS: 0.9320, UEM: 0.6830, LEM: 0.4708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5002, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||: 50%|####9 | 55/111 [00:38<00:37, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9638, LAS: 0.9313, UEM: 0.6721, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5043, loss: 0.5036, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 53%|#####3 | 59/111 [00:41<00:34, 1.52it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9633, LAS: 0.9308, UEM: 0.6646, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2075, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4249, loss: 0.5076, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 57%|#####6 | 63/111 [00:43<00:31, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9636, LAS: 0.9312, UEM: 0.6650, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1355, partial_loss/deprel_loss: 0.2434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5041, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 60%|###### | 67/111 [00:46<00:28, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9630, LAS: 0.9306, UEM: 0.6607, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4728, loss: 0.5077, batch_reg_loss: 0.1595, 
reg_loss: 0.1596 ||: 64%|######3 | 71/111 [00:48<00:25, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9626, LAS: 0.9302, UEM: 0.6624, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1859, partial_loss/deprel_loss: 0.6156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8891, loss: 0.5098, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 68%|######7 | 75/111 [00:51<00:24, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9623, LAS: 0.9297, UEM: 0.6539, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4116, partial_loss/deprel_loss: 0.3849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.5136, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 71%|#######1 | 79/111 [00:53<00:20, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9624, LAS: 0.9298, UEM: 0.6510, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2462, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5126, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 75%|#######4 | 83/111 [00:56<00:18, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9621, LAS: 0.9296, UEM: 0.6472, LEM: 0.4299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1450, partial_loss/deprel_loss: 0.2571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5159, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 78%|#######8 | 87/111 [00:59<00:16, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9611, LAS: 0.9285, UEM: 0.6402, 
LEM: 0.4247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7101, loss: 0.5234, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 81%|########1 | 90/111 [01:01<00:14, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9616, LAS: 0.9290, UEM: 0.6462, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.3448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4917, loss: 0.5197, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 85%|########4 | 94/111 [01:04<00:11, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9612, LAS: 0.9286, UEM: 0.6422, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1579, partial_loss/deprel_loss: 0.2391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.5220, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 88%|########8 | 98/111 [01:06<00:08, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9614, LAS: 0.9288, UEM: 0.6433, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2286, partial_loss/deprel_loss: 0.3183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4598, loss: 0.5200, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||: 93%|#########2| 103/111 [01:08<00:04, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9617, LAS: 0.9292, UEM: 0.6548, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2527, loss: 0.5181, 
batch_reg_loss: 0.1594, reg_loss: 0.1596 ||: 97%|#########7| 108/111 [01:11<00:01, 1.73it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9619, LAS: 0.9293, UEM: 0.6544, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1877, partial_loss/deprel_loss: 0.2913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.5172, batch_reg_loss: 0.1594, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00, 1.52it/s]\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.291 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.188 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - reg_loss | 0.160 | N/A\n", + "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UEM | 0.654 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LAS | 0.929 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - 
combo.training.tensorboard_writer - loss | 0.517 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEM | 0.441 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EM | 0.946 | N/A\n", + "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:45:16,364 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Epoch duration: 0:01:21.013571\n", + "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:13:04\n", + "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Epoch 128/399\n", + "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:45:21,258 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:45:21,267 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9686, LAS: 0.9401, UEM: 0.8848, LEM: 0.7510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7817, partial_loss/deprel_loss: 0.4661, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.6887, loss: 0.4405, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 3%|2 | 3/111 [00:02<01:29, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9672, LAS: 0.9368, UEM: 0.8125, LEM: 0.6448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3749, loss: 0.4518, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 5%|5 | 6/111 [00:04<01:22, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9654, LAS: 0.9340, UEM: 0.7629, LEM: 0.5667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3529, partial_loss/deprel_loss: 0.3521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.4713, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 9%|9 | 10/111 [00:07<01:14, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9637, LAS: 0.9319, UEM: 0.7178, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.4924, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 12%|#1 | 13/111 [00:09<01:10, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9636, LAS: 0.9311, UEM: 0.6900, LEM: 0.4815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5605, loss: 0.5032, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 14%|#4 | 16/111 [00:11<01:07, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9628, LAS: 
0.9302, UEM: 0.6866, LEM: 0.4737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4747, loss: 0.5149, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 17%|#7 | 19/111 [00:13<01:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9633, LAS: 0.9300, UEM: 0.6896, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3266, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.5101, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 20%|#9 | 22/111 [00:15<01:02, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9712, UAS: 0.9636, LAS: 0.9310, UEM: 0.7128, LEM: 0.5145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0364, partial_loss/deprel_loss: 0.1140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2578, loss: 0.5061, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 23%|##3 | 26/111 [00:18<01:01, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9634, LAS: 0.9309, UEM: 0.6973, LEM: 0.4973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3625, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5099, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||: 26%|##6 | 29/111 [00:20<01:00, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9631, LAS: 0.9306, UEM: 0.6848, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.5138, batch_reg_loss: 
0.1593, reg_loss: 0.1594 ||: 29%|##8 | 32/111 [00:22<00:57, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9634, LAS: 0.9310, UEM: 0.6844, LEM: 0.4811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4400, loss: 0.5123, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 32%|###1 | 35/111 [00:24<00:54, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9637, LAS: 0.9314, UEM: 0.6839, LEM: 0.4814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3352, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5554, loss: 0.5115, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 35%|###5 | 39/111 [00:27<00:49, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9635, LAS: 0.9312, UEM: 0.6794, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5129, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 38%|###7 | 42/111 [00:29<00:49, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9634, LAS: 0.9313, UEM: 0.6717, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2903, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4656, loss: 0.5106, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 41%|####1 | 46/111 [00:32<00:44, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9631, LAS: 0.9309, UEM: 0.6701, LEM: 0.4657, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.5113, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 44%|####4 | 49/111 [00:34<00:43, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9639, LAS: 0.9318, UEM: 0.6815, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1246, partial_loss/deprel_loss: 0.2929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4186, loss: 0.5053, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 47%|####6 | 52/111 [00:36<00:41, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9647, LAS: 0.9326, UEM: 0.6911, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2317, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4588, loss: 0.4997, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 50%|##### | 56/111 [00:39<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9643, LAS: 0.9323, UEM: 0.6836, LEM: 0.4717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5482, partial_loss/deprel_loss: 0.4451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.5023, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 53%|#####3 | 59/111 [00:41<00:36, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9643, LAS: 0.9320, UEM: 0.6791, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5901, loss: 0.5038, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||: 56%|#####5 | 62/111 [00:43<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9637, LAS: 0.9313, UEM: 0.6766, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1466, partial_loss/deprel_loss: 0.2395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3802, loss: 0.5083, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||: 59%|#####8 | 65/111 [00:45<00:32, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9310, UEM: 0.6691, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5409, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5110, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||: 61%|######1 | 68/111 [00:47<00:30, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9635, LAS: 0.9313, UEM: 0.6709, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.5081, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 64%|######3 | 71/111 [00:49<00:28, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9629, LAS: 0.9306, UEM: 0.6680, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3841, loss: 0.5118, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 68%|######7 | 75/111 [00:52<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, 
EM: 0.9399, UAS: 0.9630, LAS: 0.9309, UEM: 0.6637, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4938, loss: 0.5100, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 71%|#######1 | 79/111 [00:54<00:20, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9628, LAS: 0.9307, UEM: 0.6595, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2778, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4650, loss: 0.5112, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 76%|#######5 | 84/111 [00:56<00:15, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9622, LAS: 0.9302, UEM: 0.6550, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.5147, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 79%|#######9 | 88/111 [00:59<00:13, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9305, UEM: 0.6550, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.2957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5130, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 84%|########3 | 93/111 [01:01<00:09, 1.85it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9624, LAS: 0.9306, UEM: 0.6547, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4645, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.5553, loss: 0.5128, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 87%|########7 | 97/111 [01:03<00:07, 1.76it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9625, LAS: 0.9306, UEM: 0.6569, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5331, partial_loss/deprel_loss: 0.3988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5848, loss: 0.5122, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 91%|######### | 101/111 [01:06<00:06, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9622, LAS: 0.9302, UEM: 0.6549, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1454, partial_loss/deprel_loss: 0.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4117, loss: 0.5142, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 95%|#########4| 105/111 [01:09<00:03, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9624, LAS: 0.9303, UEM: 0.6560, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5129, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 98%|#########8| 109/111 [01:12<00:01, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9622, LAS: 0.9302, UEM: 0.6526, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5603, partial_loss/deprel_loss: 0.4172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5139, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 01:46:37,762 - INFO - combo.training.tensorboard_writer - Training 
| Validation\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.417 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.560 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - reg_loss | 0.159 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UEM | 0.653 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - LAS | 0.930 | N/A\n", + "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - loss | 0.514 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEM | 0.439 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - UAS | 0.962 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 
0.000 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EM | 0.918 | N/A\n", + "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:46:37,768 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:46:41,880 - INFO - combo.training.trainer - Epoch duration: 0:01:20.623541\n", + "2023-04-07 01:46:41,881 - INFO - combo.training.trainer - Estimated training time remaining: 6:11:38\n", + "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Epoch 129/399\n", + "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:46:41,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:46:41,889 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9571, LAS: 0.9253, UEM: 0.6291, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8287, partial_loss/deprel_loss: 0.4590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.5324, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||: 3%|2 | 3/111 [00:02<01:26, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9592, LAS: 0.9265, UEM: 0.5725, LEM: 0.3463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4818, partial_loss/deprel_loss: 0.4078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.5464, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||: 5%|5 | 6/111 [00:04<01:20, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 
0.0000, EM: 0.9294, UAS: 0.9626, LAS: 0.9302, UEM: 0.5930, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3725, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.5211, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||: 8%|8 | 9/111 [00:06<01:15, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9638, LAS: 0.9326, UEM: 0.6199, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.3696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5467, loss: 0.5010, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 11%|# | 12/111 [00:08<01:11, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9640, LAS: 0.9327, UEM: 0.6444, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1979, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4470, loss: 0.4944, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 14%|#3 | 15/111 [00:10<01:09, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9640, LAS: 0.9322, UEM: 0.6360, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.2993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4501, loss: 0.4992, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 16%|#6 | 18/111 [00:12<01:06, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9635, LAS: 0.9319, UEM: 0.6334, LEM: 0.4055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.4422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, 
loss: 0.5011, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 19%|#8 | 21/111 [00:15<01:07, 1.33it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9634, LAS: 0.9314, UEM: 0.6320, LEM: 0.3991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2485, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4827, loss: 0.5029, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 22%|##1 | 24/111 [00:17<01:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9630, LAS: 0.9313, UEM: 0.6391, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.2535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3956, loss: 0.5036, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 25%|##5 | 28/111 [00:19<00:57, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9631, LAS: 0.9318, UEM: 0.6667, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0664, partial_loss/deprel_loss: 0.1603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3006, loss: 0.4998, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 28%|##7 | 31/111 [00:22<00:57, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9316, UEM: 0.6514, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5565, partial_loss/deprel_loss: 0.4437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.5023, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 32%|###1 | 35/111 [00:24<00:53, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9644, LAS: 0.9331, 
UEM: 0.6810, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.4920, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 34%|###4 | 38/111 [00:27<00:52, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9647, LAS: 0.9334, UEM: 0.6813, LEM: 0.4670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.1904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3441, loss: 0.4904, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||: 37%|###6 | 41/111 [00:29<00:50, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9655, LAS: 0.9341, UEM: 0.6899, LEM: 0.4729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.4847, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 40%|###9 | 44/111 [00:31<00:49, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9650, LAS: 0.9336, UEM: 0.6775, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.3938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.4880, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 43%|####3 | 48/111 [00:34<00:43, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9650, LAS: 0.9337, UEM: 0.6821, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0927, partial_loss/deprel_loss: 0.2014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3387, loss: 0.4874, batch_reg_loss: 
0.1590, reg_loss: 0.1591 ||: 46%|####5 | 51/111 [00:36<00:43, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9645, LAS: 0.9329, UEM: 0.6861, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4239, loss: 0.4911, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 49%|####8 | 54/111 [00:38<00:41, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9640, LAS: 0.9326, UEM: 0.6750, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.3833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5540, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 52%|#####2 | 58/111 [00:41<00:36, 1.44it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9638, LAS: 0.9325, UEM: 0.6746, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6530, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5956, loss: 0.4935, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 56%|#####5 | 62/111 [00:43<00:32, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9447, UAS: 0.9637, LAS: 0.9322, UEM: 0.6696, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.4968, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 59%|#####9 | 66/111 [00:45<00:28, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, 
FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9640, LAS: 0.9326, UEM: 0.6803, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.4428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 63%|######3 | 70/111 [00:47<00:24, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9629, LAS: 0.9315, UEM: 0.6715, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6440, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.5023, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 67%|######6 | 74/111 [00:49<00:21, 1.75it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9632, LAS: 0.9317, UEM: 0.6740, LEM: 0.4683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.2518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.5003, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 71%|#######1 | 79/111 [00:52<00:17, 1.86it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9632, LAS: 0.9317, UEM: 0.6723, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5215, loss: 0.5008, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||: 75%|#######4 | 83/111 [00:54<00:15, 1.82it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9627, LAS: 0.9313, UEM: 0.6709, LEM: 0.4648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.3580, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5027, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 78%|#######8 | 87/111 [00:57<00:14, 1.65it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9632, LAS: 0.9318, UEM: 0.6740, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1702, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5005, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 82%|########1 | 91/111 [01:00<00:12, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9632, LAS: 0.9318, UEM: 0.6711, LEM: 0.4630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.5009, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 86%|########5 | 95/111 [01:03<00:10, 1.53it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9633, LAS: 0.9318, UEM: 0.6691, LEM: 0.4596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4655, loss: 0.5007, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 89%|########9 | 99/111 [01:05<00:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9627, LAS: 0.9312, UEM: 0.6639, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8737, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7585, loss: 0.5051, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 93%|#########2| 103/111 [01:08<00:05, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 
0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9626, LAS: 0.9309, UEM: 0.6591, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2589, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4974, loss: 0.5073, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 96%|#########6| 107/111 [01:11<00:02, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + 
"2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.311 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.279 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - reg_loss | 0.159 | N/A\n", + "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - UEM | 0.655 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - loss | 0.507 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEM | 0.445 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - EM | 0.942 | N/A\n", + "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2023-04-07 01:47:59,081 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Epoch duration: 0:01:24.181700\n", + "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Estimated training time remaining: 6:10:20\n", + "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Epoch 130/399\n", + "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:48:06,064 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:48:06,073 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9644, LAS: 0.9321, UEM: 0.6007, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4464, loss: 0.5070, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||: 4%|3 | 4/111 [00:02<01:06, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9630, LAS: 0.9319, UEM: 0.5347, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2984, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5272, loss: 0.5090, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||: 7%|7 | 8/111 [00:05<01:05, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9602, LAS: 0.9286, UEM: 0.5392, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5463, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.5236, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||: 11%|# | 12/111 [00:07<01:00, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9631, LAS: 0.9321, UEM: 0.5913, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1982, partial_loss/deprel_loss: 0.2946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 0.5061, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||: 14%|#3 | 15/111 [00:09<01:00, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9651, LAS: 0.9341, UEM: 0.6675, LEM: 0.4530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1868, partial_loss/deprel_loss: 0.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4295, loss: 0.4874, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||: 16%|#6 | 18/111 [00:11<01:02, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9650, LAS: 0.9341, UEM: 0.6555, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1861, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4318, loss: 0.4924, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||: 19%|#8 | 21/111 [00:13<01:01, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9653, LAS: 0.9344, UEM: 0.6473, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5355, loss: 0.4921, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||: 22%|##1 | 24/111 [00:15<00:59, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9638, LAS: 0.9329, UEM: 0.6244, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 
0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6071, loss: 0.5015, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||: 25%|##5 | 28/111 [00:18<00:55, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9630, LAS: 0.9317, UEM: 0.6259, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.5592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8053, loss: 0.5075, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||: 29%|##8 | 32/111 [00:21<00:52, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9632, LAS: 0.9318, UEM: 0.6266, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6027, loss: 0.5074, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 32%|###2 | 36/111 [00:23<00:48, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9640, LAS: 0.9322, UEM: 0.6423, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.4993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.5044, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 36%|###6 | 40/111 [00:26<00:46, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9647, LAS: 0.9332, UEM: 0.6779, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1671, partial_loss/deprel_loss: 0.2614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.4988, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 39%|###8 | 43/111 [00:29<00:50, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9657, LAS: 0.9343, UEM: 0.7038, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3558, loss: 0.4886, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 42%|####2 | 47/111 [00:31<00:44, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9643, LAS: 0.9328, UEM: 0.6897, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6428, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.4994, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||: 47%|####6 | 52/111 [00:34<00:37, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9641, LAS: 0.9324, UEM: 0.6784, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5417, loss: 0.5004, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 51%|#####1 | 57/111 [00:36<00:31, 1.71it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9646, LAS: 0.9329, UEM: 0.6881, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1164, partial_loss/deprel_loss: 0.2322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3677, loss: 0.4959, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 55%|#####4 | 61/111 [00:38<00:29, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9646, LAS: 0.9331, UEM: 0.6927, LEM: 0.4829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7745, partial_loss/deprel_loss: 0.3842, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.4928, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 59%|#####8 | 65/111 [00:41<00:28, 1.60it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9634, LAS: 0.9317, UEM: 0.6818, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6007, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.5024, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 62%|######2 | 69/111 [00:44<00:28, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9624, LAS: 0.9309, UEM: 0.6704, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.4756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6991, loss: 0.5085, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 66%|######5 | 73/111 [00:47<00:26, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9618, LAS: 0.9302, UEM: 0.6615, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.5133, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 68%|######8 | 76/111 [00:49<00:24, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9620, LAS: 0.9302, UEM: 0.6593, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1839, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.5124, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 71%|#######1 | 79/111 [00:51<00:22, 
1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9622, LAS: 0.9302, UEM: 0.6649, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0736, partial_loss/deprel_loss: 0.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3674, loss: 0.5128, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 74%|#######3 | 82/111 [00:54<00:21, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9626, LAS: 0.9307, UEM: 0.6698, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5096, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 77%|#######6 | 85/111 [00:56<00:19, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9628, LAS: 0.9308, UEM: 0.6682, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3937, partial_loss/deprel_loss: 0.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.5091, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 79%|#######9 | 88/111 [00:58<00:17, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9630, LAS: 0.9310, UEM: 0.6678, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.5076, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 82%|########1 | 91/111 [01:00<00:14, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9628, LAS: 0.9308, UEM: 0.6676, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 1.0291, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.5087, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 85%|########4 | 94/111 [01:03<00:12, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9626, LAS: 0.9306, UEM: 0.6626, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5218, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6246, loss: 0.5101, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 87%|########7 | 97/111 [01:05<00:10, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9626, LAS: 0.9306, UEM: 0.6591, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3161, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4923, loss: 0.5099, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||: 91%|######### | 101/111 [01:08<00:07, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9627, LAS: 0.9307, UEM: 0.6601, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7448, partial_loss/deprel_loss: 0.5054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7119, loss: 0.5095, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||: 95%|#########4| 105/111 [01:10<00:04, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9627, LAS: 0.9308, UEM: 0.6589, LEM: 0.4450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3709, loss: 0.5088, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||: 98%|#########8| 
109/111 [01:13<00:01, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9627, LAS: 0.9307, UEM: 0.6574, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6138, partial_loss/deprel_loss: 0.4042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.5099, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||: 100%|##########| 111/111 [01:14<00:00, 1.49it/s]\n", + "2023-04-07 01:49:23,847 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9558, LAS: 0.9078, UEM: 0.7180, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4751, partial_loss/deprel_loss: 23.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8436, loss: 24.3775, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:08, 1.14it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9387, LAS: 0.8868, UEM: 0.5723, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6799, partial_loss/deprel_loss: 53.1680, partial_loss/cycle_loss: 0.0000, batch_loss: 42.8704, loss: 28.7997, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9395, LAS: 0.8866, UEM: 0.5282, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7739, partial_loss/deprel_loss: 28.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 22.8540, loss: 27.7545, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 69%|######9 | 9/13 [00:08<00:03, 1.07it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 
0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9457, LAS: 0.8958, UEM: 0.6517, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 17.1259, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7388, loss: 25.1794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.00s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.01it/s]\n", + "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - 
combo.training.tensorboard_writer - patience | 2.000 | N/A\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.404 | 23.087\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.614 | 0.590\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - reg_loss | 0.159 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UEM | 0.657 | 0.660\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | 0.898\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - loss | 0.510 | 24.278\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEM | 0.443 | 0.394\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | 0.948\n", + "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - EM | 0.916 | 0.901\n", + "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:49:36,772 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:49:41,759 - INFO - combo.training.trainer - Epoch duration: 0:01:35.695957\n", + "2023-04-07 01:49:41,760 - INFO - combo.training.trainer - Estimated training time remaining: 6:09:25\n", + "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Epoch 131/399\n", + "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:49:41,761 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:49:41,771 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9658, LAS: 0.9335, UEM: 0.6562, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.3432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4763, loss: 0.4845, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 3%|2 | 3/111 [00:02<01:25, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9690, LAS: 0.9351, UEM: 0.6834, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2940, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4639, loss: 0.4758, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 5%|5 | 6/111 [00:04<01:19, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9650, LAS: 0.9318, UEM: 0.6375, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.2715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5000, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 9%|9 | 10/111 [00:06<01:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9639, LAS: 0.9309, UEM: 0.6198, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4991, partial_loss/deprel_loss: 0.4957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.5093, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 14%|#3 | 15/111 [00:09<01:00, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9632, LAS: 0.9305, UEM: 0.6157, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7437, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6957, loss: 0.5132, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 17%|#7 | 19/111 [00:11<00:58, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9644, LAS: 0.9318, UEM: 0.6112, LEM: 0.3696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3087, partial_loss/deprel_loss: 0.3383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4910, loss: 0.5065, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 21%|## | 23/111 [00:13<00:52, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9700, UAS: 0.9657, LAS: 0.9339, UEM: 0.6792, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0435, partial_loss/deprel_loss: 0.1104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.4905, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 24%|##4 | 27/111 [00:16<00:52, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9643, LAS: 0.9328, UEM: 0.6564, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3674, partial_loss/deprel_loss: 
0.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.4984, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 28%|##7 | 31/111 [00:18<00:49, 1.63it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9642, LAS: 0.9326, UEM: 0.6407, LEM: 0.4252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3813, partial_loss/deprel_loss: 0.3253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.4981, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||: 32%|###2 | 36/111 [00:20<00:42, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9645, LAS: 0.9329, UEM: 0.6449, LEM: 0.4271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4363, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.4958, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 37%|###6 | 41/111 [00:23<00:37, 1.85it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9644, LAS: 0.9328, UEM: 0.6491, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4255, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5944, loss: 0.4963, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 41%|#### | 45/111 [00:26<00:38, 1.70it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9642, LAS: 0.9327, UEM: 0.6549, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3966, partial_loss/deprel_loss: 0.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5328, loss: 0.4974, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 44%|####4 | 49/111 [00:28<00:37, 
1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9646, LAS: 0.9330, UEM: 0.6640, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3283, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.4947, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 48%|####7 | 53/111 [00:31<00:37, 1.57it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9653, LAS: 0.9338, UEM: 0.6784, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.4883, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 51%|#####1 | 57/111 [00:34<00:37, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9657, LAS: 0.9338, UEM: 0.6797, LEM: 0.4635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1760, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.4867, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 55%|#####4 | 61/111 [00:37<00:34, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9659, LAS: 0.9341, UEM: 0.6800, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4860, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 58%|#####7 | 64/111 [00:39<00:32, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9655, LAS: 0.9335, UEM: 0.6778, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4140, loss: 0.4904, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 61%|######1 | 68/111 [00:42<00:29, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9646, LAS: 0.9325, UEM: 0.6730, LEM: 0.4548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6611, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6527, loss: 0.4967, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||: 64%|######3 | 71/111 [00:44<00:27, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9640, LAS: 0.9318, UEM: 0.6679, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4213, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.5014, batch_reg_loss: 0.1585, reg_loss: 0.1585 ||: 68%|######7 | 75/111 [00:46<00:24, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9636, LAS: 0.9316, UEM: 0.6655, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5326, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 71%|#######1 | 79/111 [00:49<00:21, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9635, LAS: 0.9314, UEM: 0.6593, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4088, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5036, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 74%|#######3 | 82/111 [00:51<00:19, 
1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9638, LAS: 0.9319, UEM: 0.6595, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3843, loss: 0.5006, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 77%|#######7 | 86/111 [00:54<00:16, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9638, LAS: 0.9319, UEM: 0.6648, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6573, partial_loss/deprel_loss: 0.5130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5010, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 80%|######## | 89/111 [00:56<00:15, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9636, LAS: 0.9317, UEM: 0.6590, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4891, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.5029, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 84%|########3 | 93/111 [00:59<00:11, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9635, LAS: 0.9316, UEM: 0.6583, LEM: 0.4467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1251, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3658, loss: 0.5027, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 87%|########7 | 97/111 [01:02<00:09, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9636, LAS: 0.9318, UEM: 0.6572, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, 
ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 90%|######### | 100/111 [01:04<00:07, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9639, LAS: 0.9319, UEM: 0.6622, LEM: 0.4478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2035, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.5003, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 93%|#########2| 103/111 [01:06<00:05, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9637, LAS: 0.9318, UEM: 0.6594, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7736, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.5017, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 95%|#########5| 106/111 [01:08<00:03, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9633, LAS: 0.9314, UEM: 0.6576, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5178, loss: 0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 98%|#########8| 109/111 [01:10<00:01, 1.41it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9633, LAS: 0.9314, UEM: 0.6589, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 
0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 100%|##########| 111/111 [01:12<00:00, 1.53it/s]\n", + "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.421 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.580 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - reg_loss | 0.159 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - UEM | 0.659 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - loss | 0.504 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEM | 0.444 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 
| N/A\n", + "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - EM | 0.916 | N/A\n", + "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:50:57,372 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Epoch duration: 0:01:22.576860\n", + "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Estimated training time remaining: 6:08:03\n", + "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Epoch 132/399\n", + "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:51:04,339 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:51:04,348 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9355, LAS: 0.9035, UEM: 0.2982, LEM: 0.1404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5630, loss: 0.6882, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||: 3%|2 | 3/111 [00:02<01:25, 1.26it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9504, LAS: 0.9180, UEM: 0.5783, LEM: 0.3771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1050, partial_loss/deprel_loss: 0.2255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3598, loss: 0.5970, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||: 6%|6 | 7/111 
[00:04<01:14, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9573, LAS: 0.9259, UEM: 0.6287, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5310, partial_loss/deprel_loss: 0.3926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.5515, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||: 11%|# | 12/111 [00:06<01:04, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9604, LAS: 0.9291, UEM: 0.6289, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5247, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||: 15%|#5 | 17/111 [00:09<00:55, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9363, UAS: 0.9596, LAS: 0.9288, UEM: 0.5911, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.2964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4441, loss: 0.5271, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||: 20%|#9 | 22/111 [00:11<00:49, 1.80it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9608, LAS: 0.9298, UEM: 0.6044, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1252, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3657, loss: 0.5187, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 23%|##3 | 26/111 [00:14<00:49, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9616, LAS: 0.9301, UEM: 0.6135, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5136, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 27%|##7 | 30/111 [00:16<00:48, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9613, LAS: 0.9295, UEM: 0.5998, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 0.3298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4667, loss: 0.5181, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 31%|### | 34/111 [00:19<00:46, 1.67it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9620, LAS: 0.9306, UEM: 0.6366, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0532, partial_loss/deprel_loss: 0.1433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2835, loss: 0.5104, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 34%|###4 | 38/111 [00:22<00:48, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9631, LAS: 0.9317, UEM: 0.6435, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.5039, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 38%|###7 | 42/111 [00:24<00:43, 1.57it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9622, LAS: 0.9310, UEM: 0.6257, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6065, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5105, batch_reg_loss: 0.1583, 
reg_loss: 0.1583 ||: 41%|####1 | 46/111 [00:27<00:41, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9623, LAS: 0.9310, UEM: 0.6233, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4085, partial_loss/deprel_loss: 0.4134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.5106, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 45%|####5 | 50/111 [00:30<00:41, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9628, LAS: 0.9316, UEM: 0.6238, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2636, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.5083, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||: 49%|####8 | 54/111 [00:33<00:39, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9632, LAS: 0.9320, UEM: 0.6408, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.5037, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 51%|#####1 | 57/111 [00:35<00:39, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9324, UEM: 0.6484, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.5000, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 54%|#####4 | 60/111 [00:37<00:36, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9638, LAS: 0.9326, UEM: 0.6474, LEM: 0.4314, 
EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4825, loss: 0.4986, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 57%|#####6 | 63/111 [00:39<00:34, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9625, LAS: 0.9312, UEM: 0.6366, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9148, partial_loss/deprel_loss: 0.4920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.5080, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 60%|###### | 67/111 [00:42<00:30, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9625, LAS: 0.9313, UEM: 0.6407, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4629, loss: 0.5070, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 63%|######3 | 70/111 [00:44<00:28, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9623, LAS: 0.9311, UEM: 0.6390, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5082, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 66%|######5 | 73/111 [00:46<00:26, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9628, LAS: 0.9315, UEM: 0.6497, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0792, partial_loss/deprel_loss: 0.2490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3733, loss: 0.5059, batch_reg_loss: 0.1582, reg_loss: 
0.1583 ||: 68%|######8 | 76/111 [00:49<00:26, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9626, LAS: 0.9311, UEM: 0.6497, LEM: 0.4388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1317, partial_loss/deprel_loss: 0.2263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3656, loss: 0.5085, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 71%|#######1 | 79/111 [00:51<00:23, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9628, LAS: 0.9313, UEM: 0.6545, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.5078, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 75%|#######4 | 83/111 [00:53<00:19, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9630, LAS: 0.9315, UEM: 0.6547, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.5069, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 77%|#######7 | 86/111 [00:55<00:17, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9633, LAS: 0.9316, UEM: 0.6556, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2261, partial_loss/deprel_loss: 0.3324, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4693, loss: 0.5058, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 80%|######## | 89/111 [00:57<00:15, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9631, LAS: 0.9313, UEM: 0.6521, LEM: 
0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2621, partial_loss/deprel_loss: 0.2951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.5071, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 83%|########2 | 92/111 [01:00<00:13, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9633, LAS: 0.9317, UEM: 0.6672, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0490, partial_loss/deprel_loss: 0.1049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2518, loss: 0.5055, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||: 86%|########5 | 95/111 [01:03<00:12, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9637, LAS: 0.9318, UEM: 0.6667, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3139, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5279, loss: 0.5045, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||: 89%|########9 | 99/111 [01:05<00:08, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9638, LAS: 0.9319, UEM: 0.6678, LEM: 0.4559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1525, partial_loss/deprel_loss: 0.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3949, loss: 0.5033, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||: 92%|#########1| 102/111 [01:07<00:06, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9633, LAS: 0.9314, UEM: 0.6613, LEM: 0.4506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5928, loss: 0.5068, batch_reg_loss: 
0.1581, reg_loss: 0.1583 ||: 95%|#########4| 105/111 [01:09<00:04, 1.36it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9629, LAS: 0.9311, UEM: 0.6577, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4233, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.5092, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||: 97%|#########7| 108/111 [01:12<00:02, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9632, LAS: 0.9313, UEM: 0.6598, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1641, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5077, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:52:21,453 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - 
combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.287 | N/A\n", + "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.164 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - reg_loss | 0.158 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UEM | 0.660 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - loss | 0.508 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEM | 0.447 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EM | 0.944 | N/A\n", + "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:52:21,460 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:52:29,124 - INFO - combo.training.trainer - Epoch duration: 0:01:24.786423\n", + "2023-04-07 01:52:29,125 - INFO - combo.training.trainer - Estimated training time remaining: 6:06:46\n", + "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Epoch 133/399\n", + "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:52:29,126 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:52:29,137 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9731, LAS: 0.9427, UEM: 0.7832, LEM: 0.5870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.4103, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 5%|4 | 5/111 [00:02<00:52, 2.00it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9658, LAS: 0.9356, UEM: 0.7113, LEM: 0.5108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3312, partial_loss/deprel_loss: 0.3483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5030, loss: 0.4581, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 7%|7 | 8/111 [00:04<00:59, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9656, LAS: 0.9347, UEM: 0.7061, LEM: 0.4976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3322, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.4600, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 10%|9 | 11/111 [00:06<01:02, 1.61it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9632, LAS: 0.9318, UEM: 0.6725, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7018, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.4809, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 13%|#2 | 14/111 [00:08<01:02, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9634, LAS: 0.9313, UEM: 0.6568, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1925, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.4887, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 15%|#5 | 17/111 [00:11<01:02, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9628, LAS: 0.9303, UEM: 0.6486, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2312, partial_loss/deprel_loss: 0.2814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.4948, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 18%|#8 | 20/111 [00:13<01:03, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9638, LAS: 0.9312, UEM: 0.6779, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7755, partial_loss/deprel_loss: 0.4929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.4923, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||: 21%|## | 23/111 [00:15<01:01, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9652, LAS: 0.9330, UEM: 0.7083, LEM: 0.4995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0606, partial_loss/deprel_loss: 0.1413, 
partial_loss/cycle_loss: 0.0000, batch_loss: 0.2832, loss: 0.4807, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 23%|##3 | 26/111 [00:18<01:02, 1.36it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9646, LAS: 0.9325, UEM: 0.7066, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.3893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5661, loss: 0.4855, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 26%|##6 | 29/111 [00:20<00:59, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9635, LAS: 0.9313, UEM: 0.6873, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.4968, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 30%|##9 | 33/111 [00:22<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9639, LAS: 0.9316, UEM: 0.6871, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4994, loss: 0.4923, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 32%|###2 | 36/111 [00:24<00:53, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9619, LAS: 0.9301, UEM: 0.6684, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6564, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6154, loss: 0.5014, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 36%|###6 | 40/111 [00:27<00:48, 1.45it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9617, LAS: 0.9298, UEM: 0.6542, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5085, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6397, loss: 0.5079, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||: 40%|###9 | 44/111 [00:29<00:44, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9625, LAS: 0.9306, UEM: 0.6561, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.5018, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 43%|####3 | 48/111 [00:32<00:40, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9626, LAS: 0.9304, UEM: 0.6582, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1578, partial_loss/deprel_loss: 0.2982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.5035, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 47%|####6 | 52/111 [00:35<00:39, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9627, LAS: 0.9306, UEM: 0.6538, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5034, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 50%|##### | 56/111 [00:38<00:38, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9630, LAS: 0.9310, UEM: 0.6533, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5006, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 53%|#####3 | 59/111 [00:40<00:35, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9634, LAS: 0.9315, UEM: 0.6593, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.4973, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 56%|#####5 | 62/111 [00:42<00:34, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9632, LAS: 0.9313, UEM: 0.6543, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4943, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6070, loss: 0.4994, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||: 59%|#####8 | 65/111 [00:44<00:33, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9637, LAS: 0.9317, UEM: 0.6609, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2084, partial_loss/deprel_loss: 0.2780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4221, loss: 0.4958, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 61%|######1 | 68/111 [00:47<00:32, 1.31it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9776, UAS: 0.9645, LAS: 0.9327, UEM: 0.6818, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0263, partial_loss/deprel_loss: 0.0802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2273, loss: 0.4900, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 65%|######4 | 72/111 [00:50<00:29, 1.33it/s]\n", 
+ "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9648, LAS: 0.9329, UEM: 0.6870, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.4877, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 68%|######7 | 75/111 [00:52<00:27, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9645, LAS: 0.9325, UEM: 0.6847, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2349, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4920, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 71%|#######1 | 79/111 [00:55<00:23, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9640, LAS: 0.9320, UEM: 0.6775, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7113, partial_loss/deprel_loss: 0.4739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.4946, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 75%|#######4 | 83/111 [00:57<00:19, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9639, LAS: 0.9317, UEM: 0.6702, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.4979, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 78%|#######8 | 87/111 [01:00<00:16, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9635, LAS: 0.9313, UEM: 0.6640, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.5010, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 81%|########1 | 90/111 [01:02<00:14, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9631, LAS: 0.9310, UEM: 0.6608, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.5039, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 85%|########4 | 94/111 [01:04<00:11, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9634, LAS: 0.9313, UEM: 0.6633, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.5020, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 88%|########8 | 98/111 [01:07<00:08, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9631, LAS: 0.9310, UEM: 0.6651, LEM: 0.4536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1180, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3632, loss: 0.5052, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 92%|#########1| 102/111 [01:09<00:05, 1.59it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9632, LAS: 0.9310, UEM: 0.6633, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5050, 
batch_reg_loss: 0.1579, reg_loss: 0.1580 ||: 96%|#########6| 107/111 [01:11<00:02, 1.74it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9630, LAS: 0.9308, UEM: 0.6586, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2975, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.5058, batch_reg_loss: 0.1578, reg_loss: 0.1580 ||: 100%|##########| 111/111 [01:13<00:00, 1.51it/s]\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.287 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.297 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - reg_loss | 0.158 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UEM | 0.659 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LAS | 0.931 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - 
combo.training.tensorboard_writer - loss | 0.506 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEM | 0.446 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EM | 0.939 | N/A\n", + "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:53:46,012 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Epoch duration: 0:01:21.642784\n", + "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Estimated training time remaining: 6:05:22\n", + "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Epoch 134/399\n", + "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:53:50,769 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:53:50,776 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9718, LAS: 0.9412, UEM: 0.7633, LEM: 0.5488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.3260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.4079, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 
3%|2 | 3/111 [00:02<01:31, 1.18it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9762, LAS: 0.9468, UEM: 0.8419, LEM: 0.6702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2195, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4255, loss: 0.3891, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 5%|5 | 6/111 [00:05<01:29, 1.17it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9733, LAS: 0.9431, UEM: 0.8027, LEM: 0.6205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5134, partial_loss/deprel_loss: 0.4853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.4243, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 8%|8 | 9/111 [00:07<01:24, 1.21it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9699, LAS: 0.9392, UEM: 0.7601, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2198, partial_loss/deprel_loss: 0.2679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4161, loss: 0.4574, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 11%|# | 12/111 [00:09<01:19, 1.25it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9700, LAS: 0.9394, UEM: 0.7412, LEM: 0.5441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3738, loss: 0.4592, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 14%|#4 | 16/111 [00:12<01:13, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9695, LAS: 0.9389, UEM: 0.7309, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.4606, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 17%|#7 | 19/111 [00:14<01:09, 1.32it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9663, LAS: 0.9359, UEM: 0.7046, LEM: 0.5065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7200, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.4794, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 20%|#9 | 22/111 [00:16<01:06, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9653, LAS: 0.9347, UEM: 0.6950, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2095, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4847, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 23%|##3 | 26/111 [00:19<00:59, 1.43it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9653, LAS: 0.9347, UEM: 0.6830, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4296, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.4861, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 26%|##6 | 29/111 [00:21<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9645, LAS: 0.9338, UEM: 0.6744, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8113, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.4907, batch_reg_loss: 0.1578, 
reg_loss: 0.1578 ||: 29%|##8 | 32/111 [00:23<00:54, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9649, LAS: 0.9343, UEM: 0.6683, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4405, loss: 0.4874, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 32%|###2 | 36/111 [00:25<00:50, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9644, LAS: 0.9336, UEM: 0.6664, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3603, partial_loss/deprel_loss: 0.3563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.4898, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||: 35%|###5 | 39/111 [00:27<00:49, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9648, LAS: 0.9339, UEM: 0.6610, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3040, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.4882, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 39%|###8 | 43/111 [00:30<00:44, 1.54it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9658, LAS: 0.9349, UEM: 0.6893, LEM: 0.4781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0704, partial_loss/deprel_loss: 0.1725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3098, loss: 0.4800, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 42%|####2 | 47/111 [00:33<00:43, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9647, LAS: 0.9337, UEM: 0.6763, LEM: 0.4668, EUAS: 
0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6020, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6392, loss: 0.4875, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 45%|####5 | 50/111 [00:35<00:42, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9651, LAS: 0.9342, UEM: 0.6885, LEM: 0.4830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5349, loss: 0.4831, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 48%|####7 | 53/111 [00:37<00:41, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9645, LAS: 0.9335, UEM: 0.6874, LEM: 0.4803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8582, partial_loss/deprel_loss: 0.5299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.4878, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 50%|##### | 56/111 [00:39<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9646, LAS: 0.9337, UEM: 0.6868, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.4881, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 53%|#####3 | 59/111 [00:41<00:36, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9632, LAS: 0.9320, UEM: 0.6767, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3082, partial_loss/deprel_loss: 0.5926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.4992, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 
57%|#####6 | 63/111 [00:44<00:32, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 0.9318, UEM: 0.6657, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.5014, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 60%|###### | 67/111 [00:46<00:29, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9629, LAS: 0.9317, UEM: 0.6634, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1659, partial_loss/deprel_loss: 0.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4145, loss: 0.5002, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 64%|######3 | 71/111 [00:50<00:29, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9411, UAS: 0.9631, LAS: 0.9319, UEM: 0.6611, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2327, partial_loss/deprel_loss: 0.2979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4989, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 68%|######7 | 75/111 [00:52<00:24, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9624, LAS: 0.9312, UEM: 0.6529, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6647, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.5027, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 71%|#######1 | 79/111 [00:55<00:21, 1.46it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9625, LAS: 0.9314, UEM: 0.6539, LEM: 0.4423, EUAS: 0.0000, 
ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1623, partial_loss/deprel_loss: 0.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3610, loss: 0.5015, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||: 74%|#######3 | 82/111 [00:57<00:20, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9631, LAS: 0.9319, UEM: 0.6668, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0680, partial_loss/deprel_loss: 0.1759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3119, loss: 0.4982, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 77%|#######7 | 86/111 [01:00<00:17, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9634, LAS: 0.9321, UEM: 0.6686, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4434, loss: 0.4973, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 81%|########1 | 90/111 [01:02<00:13, 1.56it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9634, LAS: 0.9322, UEM: 0.6708, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1608, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3713, loss: 0.4965, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 86%|########5 | 95/111 [01:04<00:09, 1.67it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9634, LAS: 0.9321, UEM: 0.6702, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3192, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, 
batch_loss: 0.4710, loss: 0.4978, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 90%|######### | 100/111 [01:07<00:06, 1.81it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9633, LAS: 0.9318, UEM: 0.6683, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3566, partial_loss/deprel_loss: 0.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5360, loss: 0.5001, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 94%|#########3| 104/111 [01:09<00:04, 1.72it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9633, LAS: 0.9319, UEM: 0.6666, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2006, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.4998, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 97%|#########7| 108/111 [01:12<00:01, 1.69it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9632, LAS: 0.9319, UEM: 0.6637, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.2592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4131, loss: 0.4991, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 100%|##########| 111/111 [01:13<00:00, 1.50it/s]\n", + "2023-04-07 01:55:07,230 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | N/A\n", + "2023-04-07 
01:55:07,231 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.259 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss | 0.241 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - reg_loss | 0.158 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UEM | 0.664 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LAS | 0.932 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - loss | 0.499 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEM | 0.449 | N/A\n", + "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | N/A\n", + "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | N/A\n", + "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | N/A\n", + "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | N/A\n", + "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EM | 0.943 | N/A\n", + "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:55:07,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:55:11,923 - INFO - combo.training.trainer - Epoch duration: 0:01:21.154867\n", + "2023-04-07 01:55:11,924 - INFO - combo.training.trainer - Estimated training time remaining: 6:03:57\n", + "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Epoch 135/399\n", + "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:55:11,925 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:55:11,933 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9691, LAS: 0.9380, UEM: 0.5843, LEM: 0.3390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2373, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.4858, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||: 4%|3 | 4/111 [00:02<01:06, 1.62it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9676, LAS: 0.9361, UEM: 0.6419, LEM: 0.3989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.3518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5195, loss: 0.4727, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||: 6%|6 | 7/111 [00:04<01:09, 1.49it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9674, LAS: 0.9363, UEM: 0.6454, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4563, partial_loss/deprel_loss: 0.3694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.4696, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||: 9%|9 | 10/111 [00:07<01:10, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, 
SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9644, LAS: 0.9332, UEM: 0.6007, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.4970, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||: 13%|#2 | 14/111 [00:09<01:04, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9651, LAS: 0.9338, UEM: 0.6030, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.4959, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 15%|#5 | 17/111 [00:11<01:03, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9668, LAS: 0.9357, UEM: 0.6544, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1150, partial_loss/deprel_loss: 0.1990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3397, loss: 0.4817, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 18%|#8 | 20/111 [00:13<01:03, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9659, LAS: 0.9352, UEM: 0.6471, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.4032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5988, loss: 0.4846, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 21%|## | 23/111 [00:16<01:03, 1.38it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9641, LAS: 0.9333, UEM: 0.6212, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.3112, partial_loss/deprel_loss: 0.3003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4600, loss: 0.4957, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 24%|##4 | 27/111 [00:18<00:59, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9648, LAS: 0.9337, UEM: 0.6407, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.4937, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 27%|##7 | 30/111 [00:20<00:56, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9644, LAS: 0.9333, UEM: 0.6349, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5316, loss: 0.4975, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||: 30%|##9 | 33/111 [00:23<00:54, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9655, LAS: 0.9345, UEM: 0.6660, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1504, partial_loss/deprel_loss: 0.2351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3756, loss: 0.4871, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 32%|###2 | 36/111 [00:26<01:04, 1.16it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9662, LAS: 0.9350, UEM: 0.6732, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.2917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4273, loss: 0.4840, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 35%|###5 | 39/111 [00:28<00:58, 1.23it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9670, LAS: 0.9356, UEM: 0.6809, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1688, partial_loss/deprel_loss: 0.2671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4049, loss: 0.4804, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 38%|###7 | 42/111 [00:31<00:54, 1.27it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9672, LAS: 0.9359, UEM: 0.6859, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1178, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3628, loss: 0.4778, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 41%|#### | 45/111 [00:33<00:50, 1.30it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9668, LAS: 0.9354, UEM: 0.6857, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2961, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.4803, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 43%|####3 | 48/111 [00:35<00:46, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9666, LAS: 0.9353, UEM: 0.6826, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.4821, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 47%|####6 | 52/111 [00:37<00:42, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9658, LAS: 0.9346, UEM: 0.6777, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.7723, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6948, loss: 0.4863, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||: 50%|####9 | 55/111 [00:39<00:39, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9643, LAS: 0.9332, UEM: 0.6707, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9087, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.4946, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 52%|#####2 | 58/111 [00:42<00:38, 1.39it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9643, LAS: 0.9332, UEM: 0.6744, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3684, loss: 0.4935, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 56%|#####5 | 62/111 [00:44<00:34, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9634, LAS: 0.9321, UEM: 0.6687, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2048, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 0.5009, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 59%|#####8 | 65/111 [00:46<00:32, 1.43it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9634, LAS: 0.9317, UEM: 0.6662, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7750, partial_loss/deprel_loss: 0.5395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.5028, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 62%|######2 | 69/111 [00:49<00:27, 1.50it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9630, LAS: 0.9314, UEM: 0.6552, LEM: 0.4332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5066, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 67%|######6 | 74/111 [00:51<00:22, 1.64it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9623, LAS: 0.9308, UEM: 0.6477, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.2618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4030, loss: 0.5100, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 70%|####### | 78/111 [00:54<00:20, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9625, LAS: 0.9310, UEM: 0.6503, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2958, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5183, loss: 0.5094, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 74%|#######3 | 82/111 [00:56<00:18, 1.60it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9623, LAS: 0.9308, UEM: 0.6431, LEM: 0.4219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5388, loss: 0.5104, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 77%|#######7 | 86/111 [00:59<00:15, 1.66it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9800, UAS: 0.9630, LAS: 0.9316, UEM: 0.6675, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.0234, partial_loss/deprel_loss: 0.0818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2275, loss: 0.5049, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 81%|########1 | 90/111 [01:01<00:13, 1.56it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9625, LAS: 0.9312, UEM: 0.6606, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6511, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 0.5073, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 86%|########5 | 95/111 [01:04<00:09, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9624, LAS: 0.9311, UEM: 0.6529, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3028, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4740, loss: 0.5081, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 90%|######### | 100/111 [01:06<00:06, 1.79it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9629, LAS: 0.9315, UEM: 0.6583, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5472, loss: 0.5050, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||: 95%|#########4| 105/111 [01:09<00:03, 1.90it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9260, UAS: 0.9632, LAS: 0.9317, UEM: 0.6619, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4365, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5709, loss: 0.5032, 
batch_reg_loss: 0.1573, reg_loss: 0.1575 ||: 98%|#########8| 109/111 [01:11<00:01, 1.78it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9632, LAS: 0.9317, UEM: 0.6597, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5031, batch_reg_loss: 0.1573, reg_loss: 0.1575 ||: 100%|##########| 111/111 [01:13<00:00, 1.52it/s]\n", + "2023-04-07 01:56:27,897 - INFO - allennlp.training.trainer - Validating\n", + " 0%| | 0/13 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9614, LAS: 0.9128, UEM: 0.7969, LEM: 0.5543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 34.5376, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8322, loss: 19.9957, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 23%|##3 | 3/13 [00:02<00:09, 1.01it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9551, LAS: 0.9059, UEM: 0.7413, LEM: 0.4867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3425, partial_loss/deprel_loss: 44.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 35.9504, loss: 23.2370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 46%|####6 | 6/13 [00:05<00:06, 1.03it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9458, LAS: 0.8954, UEM: 0.6814, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7257, partial_loss/deprel_loss: 28.0299, partial_loss/cycle_loss: 0.0000, batch_loss: 22.5690, loss: 25.5143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 62%|######1 | 8/13 [00:07<00:04, 1.00it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9509, LAS: 0.9015, UEM: 0.6917, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 24.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9122, loss: 23.2583, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 85%|########4 | 11/13 [00:10<00:01, 1.02it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9485, LAS: 0.8984, UEM: 0.6581, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9117, partial_loss/deprel_loss: 29.0845, partial_loss/cycle_loss: 0.0000, batch_loss: 23.4500, loss: 23.9880, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00, 1.03it/s]\n", + "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - Training | Validation\n", + "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - ELEM | 0.000 | 0.000\n", + "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - XPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UPOS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - ELAS | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - patience | 1.000 | N/A\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - SEMREL_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUEM | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss | 0.383 | 29.085\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - 
partial_loss/head_loss | 0.461 | 0.912\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - reg_loss | 0.157 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UEM | 0.660 | 0.658\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LAS | 0.932 | 0.898\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - loss | 0.503 | 23.988\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB | 2425.273 | N/A\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEM | 0.448 | 0.396\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEMMA_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUAS | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UAS | 0.963 | 0.949\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - FEATS_ACC | 0.000 | 0.000\n", + "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EM | 0.921 | 0.884\n", + "2023-04-07 01:56:40,530 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB | 7070.324 | N/A\n", + "2023-04-07 01:56:40,533 - INFO - allennlp.training.checkpointer - Best validation performance so far. 
Copying weights to './allennlpru3hb8qq/best.th'.\n", + "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Epoch duration: 0:01:32.824060\n", + "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Estimated training time remaining: 6:02:55\n", + "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Epoch 136/399\n", + "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n", + "2023-04-07 01:56:44,750 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n", + "2023-04-07 01:56:44,759 - INFO - allennlp.training.trainer - Training\n", + " 0%| | 0/111 [00:00<?, ?it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9701, LAS: 0.9398, UEM: 0.6759, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1820, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.4615, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 4%|3 | 4/111 [00:02<01:11, 1.49it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9697, LAS: 0.9401, UEM: 0.7084, LEM: 0.4874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4933, partial_loss/deprel_loss: 0.3671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.4480, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 7%|7 | 8/111 [00:05<01:07, 1.52it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9687, LAS: 0.9379, UEM: 0.6801, LEM: 0.4486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2307, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.4613, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 10%|9 | 11/111 
[00:07<01:06, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9682, LAS: 0.9380, UEM: 0.6869, LEM: 0.4659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1802, partial_loss/deprel_loss: 0.2410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3861, loss: 0.4555, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 14%|#3 | 15/111 [00:09<01:03, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9685, LAS: 0.9379, UEM: 0.6714, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4714, loss: 0.4577, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 17%|#7 | 19/111 [00:12<01:01, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9658, LAS: 0.9350, UEM: 0.6613, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9620, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.4760, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 21%|## | 23/111 [00:15<00:58, 1.51it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9653, LAS: 0.9344, UEM: 0.6476, LEM: 0.4248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5369, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.4804, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 23%|##3 | 26/111 [00:17<00:57, 1.48it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9657, LAS: 0.9349, UEM: 0.6618, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 
0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.4762, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 26%|##6 | 29/111 [00:19<00:57, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9647, LAS: 0.9336, UEM: 0.6680, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0720, partial_loss/deprel_loss: 0.2051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.4839, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||: 29%|##8 | 32/111 [00:21<00:57, 1.37it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9650, LAS: 0.9338, UEM: 0.6674, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1642, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3932, loss: 0.4823, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 32%|###2 | 36/111 [00:24<00:54, 1.38it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9646, LAS: 0.9335, UEM: 0.6565, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4016, partial_loss/deprel_loss: 0.3892, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5489, loss: 0.4877, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 35%|###5 | 39/111 [00:26<00:51, 1.40it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9645, LAS: 0.9335, UEM: 0.6487, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.4894, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 38%|###7 | 42/111 [00:28<00:48, 1.41it/s]\n", + 
"UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9646, LAS: 0.9337, UEM: 0.6573, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0802, partial_loss/deprel_loss: 0.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3153, loss: 0.4892, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 41%|####1 | 46/111 [00:31<00:45, 1.41it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9645, LAS: 0.9333, UEM: 0.6492, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 45%|####5 | 50/111 [00:34<00:41, 1.47it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9644, LAS: 0.9332, UEM: 0.6480, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6622, partial_loss/deprel_loss: 0.4969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.4916, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 49%|####8 | 54/111 [00:36<00:37, 1.50it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9653, LAS: 0.9342, UEM: 0.6665, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4853, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 52%|#####2 | 58/111 [00:38<00:33, 1.58it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9645, LAS: 0.9335, UEM: 0.6710, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, 
partial_loss/head_loss: 0.5423, partial_loss/deprel_loss: 0.4684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.4904, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||: 56%|#####5 | 62/111 [00:41<00:29, 1.68it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9643, LAS: 0.9335, UEM: 0.6663, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||: 60%|###### | 67/111 [00:43<00:24, 1.83it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9639, LAS: 0.9331, UEM: 0.6543, LEM: 0.4413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3624, partial_loss/deprel_loss: 0.3598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5175, loss: 0.4936, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||: 65%|######4 | 72/111 [00:45<00:20, 1.93it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9639, LAS: 0.9333, UEM: 0.6653, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4176, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5278, loss: 0.4929, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||: 68%|######8 | 76/111 [00:48<00:20, 1.75it/s]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9643, LAS: 0.9336, UEM: 0.6732, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1612, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4059, loss: 0.4902, batch_reg_loss: 
0.1572, reg_loss: 0.1572 ||: 72%|#######2 | 80/111 [00:51<00:19, 1.55it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9637, LAS: 0.9332, UEM: 0.6708, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.4919, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 76%|#######5 | 84/111 [00:54<00:18, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9633, LAS: 0.9327, UEM: 0.6642, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7168, loss: 0.4959, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 79%|#######9 | 88/111 [00:57<00:16, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9628, LAS: 0.9321, UEM: 0.6605, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.4999, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 82%|########1 | 91/111 [01:00<00:14, 1.35it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9626, LAS: 0.9319, UEM: 0.6593, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.5013, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 85%|########4 | 94/111 [01:02<00:12, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9628, LAS: 0.9321, 
UEM: 0.6646, LEM: 0.4604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1742, partial_loss/deprel_loss: 0.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3536, loss: 0.4988, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 87%|########7 | 97/111 [01:04<00:10, 1.29it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9628, LAS: 0.9321, UEM: 0.6630, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4777, partial_loss/deprel_loss: 0.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.4990, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 90%|######### | 100/111 [01:06<00:08, 1.34it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9631, LAS: 0.9322, UEM: 0.6644, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3459, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.4976, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 94%|#########3| 104/111 [01:09<00:04, 1.45it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9630, LAS: 0.9320, UEM: 0.6604, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3434, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.4983, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 96%|#########6| 107/111 [01:11<00:02, 1.44it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 
0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00, 1.42it/s]\n", + "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00, 1.50it/s]\n", + "2023-04-07 01:58:01,554 - INFO - combo.training.trainer - Ran out of patience. Stopping training.\n", + "2023-04-07 01:58:01,554 - INFO - allennlp.training.checkpointer - loading best weights\n", + "2023-04-07 01:58:02,804 - INFO - allennlp.common.util - Metrics: {\n", + " \"best_epoch\": 135,\n", + " \"peak_worker_0_memory_MB\": 7070.32421875,\n", + " \"peak_gpu_0_memory_MB\": 2425.27294921875,\n", + " \"training_duration\": \"3:06:53.221860\",\n", + " \"training_start_epoch\": 0,\n", + " \"training_epochs\": 135,\n", + " \"epoch\": 135,\n", + " \"training_UPOS_ACC\": 0.0,\n", + " \"training_XPOS_ACC\": 0.0,\n", + " \"training_SEMREL_ACC\": 0.0,\n", + " \"training_LEMMA_ACC\": 0.0,\n", + " \"training_FEATS_ACC\": 0.0,\n", + " \"training_EM\": 0.9211469292640686,\n", + " \"training_UAS\": 0.9631774675364263,\n", + " \"training_LAS\": 0.9317305657860291,\n", + " \"training_UEM\": 0.6596950631978689,\n", + " \"training_LEM\": 0.4481664116080032,\n", + " \"training_EUAS\": 0.0,\n", + " \"training_ELAS\": 0.0,\n", + " \"training_EUEM\": 0.0,\n", + " \"training_ELEM\": 0.0,\n", + " \"training_partial_loss/head_loss\": 0.4608195722103119,\n", + " \"training_partial_loss/deprel_loss\": 0.3828725218772888,\n", + " \"training_partial_loss/cycle_loss\": 0.0,\n", + " \"training_loss\": 0.5030799737653217,\n", + " \"training_reg_loss\": 0.15746027405734533,\n", + " \"training_worker_0_memory_MB\": 7070.32421875,\n", + " 
\"training_gpu_0_memory_MB\": 2425.27294921875,\n", + " \"training_patience\": 1,\n", + " \"validation_UPOS_ACC\": 0.0,\n", + " \"validation_XPOS_ACC\": 0.0,\n", + " \"validation_SEMREL_ACC\": 0.0,\n", + " \"validation_LEMMA_ACC\": 0.0,\n", + " \"validation_FEATS_ACC\": 0.0,\n", + " \"validation_EM\": 0.8841390609741211,\n", + " \"validation_UAS\": 0.948533243417221,\n", + " \"validation_LAS\": 0.898415228519756,\n", + " \"validation_UEM\": 0.6580882352941176,\n", + " \"validation_LEM\": 0.3961397058823529,\n", + " \"validation_EUAS\": 0.0,\n", + " \"validation_ELAS\": 0.0,\n", + " \"validation_EUEM\": 0.0,\n", + " \"validation_ELEM\": 0.0,\n", + " \"validation_partial_loss/head_loss\": 0.91168212890625,\n", + " \"validation_partial_loss/deprel_loss\": 29.084543228149414,\n", + " \"validation_partial_loss/cycle_loss\": 0.0,\n", + " \"validation_loss\": 23.987967637869026,\n", + " \"validation_reg_loss\": 0.0,\n", + " \"best_validation_UPOS_ACC\": 0.0,\n", + " \"best_validation_XPOS_ACC\": 0.0,\n", + " \"best_validation_SEMREL_ACC\": 0.0,\n", + " \"best_validation_LEMMA_ACC\": 0.0,\n", + " \"best_validation_FEATS_ACC\": 0.0,\n", + " \"best_validation_EM\": 0.8841390609741211,\n", + " \"best_validation_UAS\": 0.948533243417221,\n", + " \"best_validation_LAS\": 0.898415228519756,\n", + " \"best_validation_UEM\": 0.6580882352941176,\n", + " \"best_validation_LEM\": 0.3961397058823529,\n", + " \"best_validation_EUAS\": 0.0,\n", + " \"best_validation_ELAS\": 0.0,\n", + " \"best_validation_EUEM\": 0.0,\n", + " \"best_validation_ELEM\": 0.0,\n", + " \"best_validation_partial_loss/head_loss\": 0.91168212890625,\n", + " \"best_validation_partial_loss/deprel_loss\": 29.084543228149414,\n", + " \"best_validation_partial_loss/cycle_loss\": 0.0,\n", + " \"best_validation_loss\": 23.987967637869026,\n", + " \"best_validation_reg_loss\": 0.0\n", + "}\n", + "2023-04-07 01:58:02,805 - INFO - allennlp.models.archival - archiving weights and vocabulary to 
./allennlpru3hb8qq/model.tar.gz\n", + "2023-04-07 02:10:56,965 - INFO - combo.main - Training model stored in: ./allennlpru3hb8qq\n" + ] + } + ], + "source": [ + "! {COMBO} --mode train \\\n", + " --training_data_path connlu/pdbc-train.conllu \\\n", + " --validation_data_path connlu/pdbc-validation.conllu \\\n", + " --cuda_device 0 \\\n", + " --pretrained_transformer_name allegro/herbert-large-cased \\\n", + " --targets head,deprel \\\n", + " --serialization_dir ." + ] + }, + { + "cell_type": "markdown", + "id": "e2c0090a", + "metadata": {}, + "source": [ + "Change `allennlp...` to the directory produced by COMBO." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "f630757b", + "metadata": {}, + "outputs": [], + "source": [ + "! rm -r model-pdbc/\n", + "! mv allennlpru3hb8qq/ model-pdbc/" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "combo_python39", + "language": "python", + "name": "combo_python39" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/TrainingAndEval.ipynb a/TrainingAndEval.ipynb new file mode 100644 index 0000000..753718e --- /dev/null +++ a/TrainingAndEval.ipynb @@ -0,0 +1,1546 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "97d0c9ab", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2023-04-11 11:17:29.095631: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n", + "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", + "2023-04-11 11:17:29.331444: E 
tensorflow/stream_executor/cuda/cuda_blas.cc:2981] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n", + "2023-04-11 11:17:30.167497: W tensorflow/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory\n", + "2023-04-11 11:17:30.167593: W tensorflow/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory\n", + "2023-04-11 11:17:30.167603: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n" + ] + } + ], + "source": [ + "import importlib\n", + "\n", + "from collections import Counter\n", + "\n", + "import tensorflow as tf\n", + "\n", + "from datasets import load_dataset\n", + "from IPython.display import display, HTML, IFrame" + ] + }, + { + "cell_type": "markdown", + "id": "7464a6fa", + "metadata": {}, + "source": [ + "**Comment out to use GPU!**" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "c41d6630", + "metadata": {}, + "outputs": [], + "source": [ + "#import os\n", + "#os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"-1\"" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "f30d7b7c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "1 Physical GPUs, 1 Logical GPUs\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2023-04-11 11:17:31.717262: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node 
zero\n", + "2023-04-11 11:17:31.762533: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:31.763529: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:31.765670: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n", + "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", + "2023-04-11 11:17:31.769196: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:31.770058: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:31.770816: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.722287: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.723281: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.724062: I 
tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.724846: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1616] Created device /job:localhost/replica:0/task:0/device:GPU:0 with 20480 MB memory: -> device: 0, name: NVIDIA A100 80GB PCIe, pci bus id: 0000:00:05.0, compute capability: 8.0\n" + ] + } + ], + "source": [ + "# https://www.tensorflow.org/guide/gpu\n", + "gpus = tf.config.list_physical_devices('GPU')\n", + "if gpus:\n", + " try:\n", + " tf.config.set_logical_device_configuration(\n", + " gpus[0],\n", + " [tf.config.LogicalDeviceConfiguration(memory_limit=20*1024)]\n", + " )\n", + " logical_gpus = tf.config.list_logical_devices('GPU')\n", + " print(len(gpus), \"Physical GPUs,\", len(logical_gpus), \"Logical GPUs\")\n", + " except RuntimeError as e:\n", + " print(e)" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "89afdb1e", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "/device:GPU:0\n", + "2.10.0\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2023-04-11 11:17:32.739308: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.740224: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.740975: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.741809: I 
tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.742586: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n", + "2023-04-11 11:17:32.743322: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1616] Created device /device:GPU:0 with 20480 MB memory: -> device: 0, name: NVIDIA A100 80GB PCIe, pci bus id: 0000:00:05.0, compute capability: 8.0\n" + ] + } + ], + "source": [ + "print(tf.test.gpu_device_name())\n", + "print(tf.__version__)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "2b0ab576", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Found cached dataset pdb_c_beta (/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "55f181333dc44c7a811c515cc55c4988", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/3 [00:00<?, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "pdbc_dataset = load_dataset('pdb_c_beta')" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "2f4c317a", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-ff2490f308f7f25b.arrow\n", + "Loading cached processed dataset at 
/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-cbb40b0e978ab6ee.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-3facbd810991cd6c.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-e54a8628e59de21f.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-9692de6b8224e758.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-4042ffa1dc5d9323.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-fb250709424f85ec.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-1f6ce0a488a89d56.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-2ae4daf5101c7aa2.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-a1686820d15bcf04.arrow\n", + "Loading cached processed dataset at 
/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-fe2c12481861f4bd.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-da5a875c385c3570.arrow\n" + ] + } + ], + "source": [ + "import importlib\n", + "\n", + "from neural_parser import hybrid_tree_utils\n", + "importlib.reload(hybrid_tree_utils)\n", + "from neural_parser import dataset_utils\n", + "importlib.reload(dataset_utils)\n", + "\n", + "pdbc_dataset_spines = dataset_utils.add_spines_and_attachments(pdbc_dataset)\n", + "pdbc_dataset_spines_compressed = dataset_utils.add_spines_and_attachments(pdbc_dataset, compress=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "de1966ed", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-1dfcf507d62f6da8.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-264c0111246b25c1.arrow\n", + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-6a40675124a412f0.arrow\n" + ] + } + ], + "source": [ + "features = pdbc_dataset_spines['train'].features\n", + "pdbc_dataset_spines_cont = pdbc_dataset_spines.filter(\n", + " lambda instance: hybrid_tree_utils.tree_from_dataset_instance(instance, features).is_continuous()\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "33ff295b", + "metadata": {}, + "outputs": [ + 
{ + "data": { + "text/plain": [ + "DatasetDict({\n", + " train: Dataset({\n", + " features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n", + " num_rows: 15903\n", + " })\n", + " validation: Dataset({\n", + " features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n", + " num_rows: 1980\n", + " })\n", + " test: Dataset({\n", + " features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n", + " num_rows: 1990\n", + " })\n", + "})" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pdbc_dataset_spines_cont" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "a8ddbc1f", + "metadata": {}, + "outputs": [], + "source": [ + "MODEL = 'allegro/herbert-large-cased'" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "8029594b", + "metadata": {}, + "outputs": [], + "source": [ + "class ClassificationTask(object):\n", + " \n", + " def __init__(\n", + " self,\n", + " name,\n", + " dataset,\n", + " ):\n", + " self.name = name\n", + " self.dataset = dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "id": "be8e93fa", + "metadata": {}, + "outputs": [], + "source": [ + "def crop(dataset, n):\n", + " return dataset.filter(lambda example: len(example['tokens']) <= n)\n", + "\n", + "spines_pdbc = ClassificationTask(\n", + " 'spines_pdbc',\n", + " pdbc_dataset_spines,\n", + " #crop(pdbc_dataset, 6),\n", + ")\n", + "\n", + "spines_pdbc_cont = ClassificationTask(\n", + " 'spines_pdbc_cont',\n", + " pdbc_dataset_spines_cont,\n", + " #crop(pdbc_dataset, 6),\n", + ")\n", + "\n", + "spines_pdbc_compressed = ClassificationTask(\n", + " 'spines_pdbc_compressed',\n", + " 
pdbc_dataset_spines_compressed,\n", + " #crop(pdbc_dataset, 6),\n", + ")\n", + "\n", + "TASK = spines_pdbc_compressed\n", + "TRAIN = False" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "7824fcee", + "metadata": {}, + "outputs": [], + "source": [ + "from neural_parser import training" + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "id": "1eb5f41a", + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Loading BERT tokenizer...\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-49fe5b05228c3588.arrow\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Preprocessing the dataset for BERT...\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "5f108b00fcab4db8a610f24ae03b7308", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/2211 [00:00<?, ?ex/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-b8e2900fbd9615fd.arrow\n", + "You're using a HerbertTokenizerFast tokenizer. 
Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.\n" + ] + } + ], + "source": [ + "trainer = training.Trainer(\n", + " MODEL,\n", + " dataset=TASK.dataset,\n", + " batch_size=16,\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "ac012dc7", + "metadata": {}, + "source": [ + "### Training with TensorBoard logging" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "id": "276708cc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "('keras_fit_logs_spines_pdbc_compressed', 'models_spines_pdbc_compressed')" + ] + }, + "execution_count": 39, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "log_dir = f'keras_fit_logs_{TASK.name}'\n", + "model_dir = f'models_{TASK.name}'\n", + "\n", + "log_dir, model_dir" + ] + }, + { + "cell_type": "code", + "execution_count": 40, + "id": "e8ccde06", + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The tensorboard extension is already loaded. To reload it, use:\n", + " %reload_ext tensorboard\n", + "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. 
Disabling parallelism to avoid deadlocks...\n", + "To disable this warning, you can either:\n", + "\t- Avoid using `tokenizers` before the fork if possible\n", + "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n" + ] + }, + { + "data": { + "text/html": [ + "\n", + " <iframe id=\"tensorboard-frame-83a6a03964d4187a\" width=\"100%\" height=\"800\" frameborder=\"0\">\n", + " </iframe>\n", + " <script>\n", + " (function() {\n", + " const frame = document.getElementById(\"tensorboard-frame-83a6a03964d4187a\");\n", + " const url = new URL(\"/\", window.location);\n", + " const port = 6004;\n", + " if (port) {\n", + " url.port = port;\n", + " }\n", + " frame.src = url;\n", + " })();\n", + " </script>\n", + " " + ], + "text/plain": [ + "<IPython.core.display.HTML object>" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%load_ext tensorboard\n", + "! killall tensorboard\n", + "%tensorboard --port 6004 \\\n", + " --logdir_spec logs:{log_dir},logs0:{keras_fit_logs_spines_pdbc}" + ] + }, + { + "cell_type": "code", + "execution_count": 41, + "id": "a5b0da64", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 6 µs, sys: 1 µs, total: 7 µs\n", + "Wall time: 15.7 µs\n" + ] + } + ], + "source": [ + "%%time\n", + "\n", + "if TRAIN:\n", + " parser = trainer.train(\n", + " lr=0.00001,\n", + " epochs=50,\n", + " log_dir=log_dir,\n", + " model_dir=model_dir,\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "id": "e42b2bd4", + "metadata": {}, + "outputs": [], + "source": [ + "#import importlib\n", + "#from neural_parser import hybrid_tree_utils\n", + "#importlib.reload(hybrid_tree_utils)\n", + "#from neural_parser import data_utils\n", + "#importlib.reload(data_utils)\n", + "#from neural_parser import constituency_parser\n", + "#importlib.reload(constituency_parser)" + ] + }, + { + "cell_type": "code", + 
"execution_count": 43, + "id": "2f65dead", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "created 3 classifier(s)\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Some layers from the model checkpoint at models_spines_pdbc_compressed/model were not used when initializing TFBertForMultiTargetTokenClassification: ['dropout_73']\n", + "- This IS expected if you are initializing TFBertForMultiTargetTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n", + "- This IS NOT expected if you are initializing TFBertForMultiTargetTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n", + "All the layers of TFBertForMultiTargetTokenClassification were initialized from the model checkpoint at models_spines_pdbc_compressed/model.\n", + "If your task is similar to the task the model of the checkpoint was trained on, you can already use TFBertForMultiTargetTokenClassification for predictions without further training.\n" + ] + } + ], + "source": [ + "if not TRAIN:\n", + " from neural_parser import constituency_parser\n", + " parser = constituency_parser.ConstituencyParser.load(model_dir)" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "id": "24edee79", + "metadata": {}, + "outputs": [], + "source": [ + "sentences = [\n", + " 'Miał em kotka .',\n", + " 'Wlazł kotek na płotek i mruga .',\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "4a7cd10b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "1/1 [==============================] - 10s 10s/step\n" + ] + }, + { + "data": { + "text/plain": [ + "[(['Miał', 'em', 'kotka', '.'],\n", + " 
{'spines': ['ROOT_S_VP_V', '<EMPTY>', 'NP_N', 'Punct'],\n", + " 'anchors': ['<ROOT>', 'V', 'S', 'ROOT'],\n", + " 'anchor_hs': ['<ROOT>', '1', '1', '1']}),\n", + " (['Wlazł', 'kotek', 'na', 'płotek', 'i', 'mruga', '.'],\n", + " {'spines': ['VP_V',\n", + " 'NP_N',\n", + " 'PrepNP_Prep',\n", + " 'NP_N',\n", + " 'ROOT_S_VP_Conj',\n", + " 'VP_V',\n", + " 'Punct'],\n", + " 'anchors': ['VP', 'S', 'VP', 'PrepNP', '<ROOT>', 'VP', 'ROOT'],\n", + " 'anchor_hs': ['1', '1', '2', '1', '<ROOT>', '1', '1']})]" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "parser.parse(sentences)" + ] + }, + { + "cell_type": "markdown", + "id": "b814587d", + "metadata": {}, + "source": [ + "### Evaluation\n", + "\n", + "#### Hybrid" + ] + }, + { + "cell_type": "code", + "execution_count": 46, + "id": "4ac4b9df", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "<module 'neural_parser.constants' from '/home/kkrasnowska/neural-parsing/ICCS/neural_parser/constants.py'>" + ] + }, + "execution_count": 46, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from neural_parser import hybrid_tree_utils\n", + "importlib.reload(hybrid_tree_utils)\n", + "from neural_parser import constants\n", + "importlib.reload(constants)" + ] + }, + { + "cell_type": "code", + "execution_count": 47, + "id": "d1b28792", + "metadata": {}, + "outputs": [], + "source": [ + "from spacy import displacy\n", + "\n", + "def to_deps(tokens, deprels, heads):\n", + " deps = {'words' : [], 'arcs' : []}\n", + " for i, (token, deprel, head) in enumerate(zip(tokens, deprels, heads)):\n", + " deps['words'].append({'text' : token, 'tag' : 'X'})\n", + " if head >= 0:\n", + " d = 'left' if head > i else 'right'\n", + " start, end = sorted((i, head))\n", + " deps['arcs'].append({'start' : start, 'end' : end, 'label' : deprel, 'dir' : d})\n", + " return deps\n", + "\n", + "def display_deps(tokens, deprels, heads):\n", + " 
displacy.render(to_deps(tokens, deprels, heads), manual=True, options={'distance' : 80})\n", + " \n", + "import urllib.parse\n", + "import json\n", + "\n", + "def show_tree(tree):\n", + " tree_json = json.dumps(hybrid_tree_utils.tree2dict(tree)['tree'])\n", + " src = f'http://127.0.0.1:8010/?tree={urllib.parse.quote(tree_json)}'\n", + " display(IFrame(src, 950, 550))" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "id": "9f443569", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2211\n", + "2205\n", + "['Całuję', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'heads': [None, 0],\n", + " 'deprels': ['ROOT', 'punct'],\n", + " 'spines': ['ROOT_S_VP_V', 'Punct'],\n", + " 'anchors': ['<ROOT>', 'ROOT'],\n", + " 'anchor_hs': ['<ROOT>', '1']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "['Drzemał', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'heads': [None, 0],\n", + " 'deprels': ['ROOT', 'punct'],\n", + " 'spines': ['ROOT_S_VP_V', 'Punct'],\n", + " 'anchors': ['<ROOT>', 'ROOT'],\n", + " 'anchor_hs': ['<ROOT>', '1']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "HDR = [\n", + " 'heads', 'deprels',\n", + " constants.SPINES, constants.ANCHORS, constants.ANCHOR_HS\n", + "]\n", + "\n", + "values = ['heads']\n", + "\n", + "def get_gold_data(dataset):\n", + " GOLD = []\n", + " for sent in dataset:\n", + " tokens = sent[constants.TOKENS]\n", + " tags = {\n", + " c : [dataset.features[c].feature.int2str(v) if c not in values else v for v in sent[c]]\n", + " for c in HDR\n", + " }\n", + " GOLD.append([tokens, tags])\n", + " GOLD = sorted(GOLD, key=lambda x: (len(x[0]), ''.join(x[0])))\n", + " print(len(GOLD))\n", + " TOKENS, TAGS = zip(*GOLD)\n", + " return TOKENS, TAGS\n", + "\n", + "TOKENS_VAL, TAGS_VAL = get_gold_data(TASK.dataset['validation'])\n", 
+ "TOKENS_TEST, TAGS_TEST = get_gold_data(TASK.dataset['test'])\n", + "\n", + "print(TOKENS_VAL[0])\n", + "display(TAGS_VAL[0])\n", + "print(TOKENS_TEST[0])\n", + "display(TAGS_TEST[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 49, + "id": "3f53c039", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "70/70 [==============================] - 17s 152ms/step\n", + "69/69 [==============================] - 12s 168ms/step\n", + "['Całuję', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'spines': ['ROOT_S_VP_V', 'Punct'],\n", + " 'anchors': ['<ROOT>', 'ROOT'],\n", + " 'anchor_hs': ['<ROOT>', '1']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "['Drzemał', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'spines': ['ROOT_S_VP_V', 'Punct'],\n", + " 'anchors': ['<ROOT>', 'ROOT'],\n", + " 'anchor_hs': ['<ROOT>', '1']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def get_predicted_data(TOKENS_TRUE):\n", + " PARSED = parser.parse([' '.join(toks) for toks in TOKENS_TRUE])\n", + " TOKENS, TAGS = zip(*PARSED)\n", + " try:\n", + " assert(TOKENS == TOKENS_TRUE)\n", + " except:\n", + " for tp, tt in zip(TOKENS, TOKENS_TRUE):\n", + " if tp != tt:\n", + " print(tp)\n", + " print(tt)\n", + " raise\n", + " return TOKENS, TAGS\n", + "\n", + "TOKENS_P_VAL, TAGS_P_VAL = get_predicted_data(TOKENS_VAL)\n", + "TOKENS_P_TEST, TAGS_P_TEST = get_predicted_data(TOKENS_TEST)\n", + "\n", + "print(TOKENS_P_VAL[0])\n", + "display(TAGS_P_VAL[0])\n", + "print(TOKENS_P_TEST[0])\n", + "display(TAGS_P_TEST[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 50, + "id": "17c1d9cb", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2211\n", + "2205\n", + "['Całuję', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'heads': [None, 0], 
'deprels': ['root', 'punct']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "['Drzemał', '.']\n" + ] + }, + { + "data": { + "text/plain": [ + "{'heads': [None, 0], 'deprels': ['root', 'punct']}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import conllu\n", + "\n", + "def get_combo_data(path):\n", + " fields = list(conllu.parser.DEFAULT_FIELDS)\n", + " fields[1] = 'token' \n", + " with open(path) as f:\n", + " x = conllu.parse(f.read(), fields=fields)\n", + " COMBO = []\n", + " for sent in x:\n", + " tokens = [tok['token'] for tok in sent]\n", + " heads = [tok['head'] - 1 if tok['head'] != 0 else None for tok in sent]\n", + " deprels = [tok['deprel'] for tok in sent]\n", + " COMBO.append([tokens, {'heads' : heads, 'deprels' : deprels}])\n", + "\n", + " COMBO = sorted(COMBO, key=lambda x: (len(x[0]), ''.join(x[0])))\n", + " print(len(COMBO))\n", + " TOKENS, TAGS = zip(*COMBO)\n", + " return TOKENS, TAGS\n", + "\n", + "TOKENS_C_VAL, TAGS_C_VAL = get_combo_data('COMBO/connlu/pdbc-validation-pred.conllu')\n", + "TOKENS_C_TEST, TAGS_C_TEST = get_combo_data('COMBO/connlu/pdbc-test-pred.conllu')\n", + "\n", + "assert(TOKENS_C_VAL == TOKENS_VAL)\n", + "assert(TOKENS_C_TEST == TOKENS_TEST)\n", + "\n", + "print(TOKENS_C_VAL[0])\n", + "display(TAGS_C_VAL[0])\n", + "print(TOKENS_C_TEST[0])\n", + "display(TAGS_C_TEST[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 51, + "id": "004918c6", + "metadata": {}, + "outputs": [], + "source": [ + "def _tree2spans(tree, spans, labeled=True, headed=False):\n", + " if headed and not labeled:\n", + " raise RuntimeError('cant’t use headed=True with labeled=False')\n", + " if not tree.children:\n", + " return {tree.from_index}\n", + " span = set()\n", + " for child in tree.children:\n", + " span.update(_tree2spans(child, spans, labeled, headed))\n", + " spans += [(tuple(sorted(span)), tree.category if 
labeled else 'SPAN', tree.is_head if headed else False)]\n", + " return span\n", + "\n", + "def tree2spans(tree, labeled=True, headed=False):\n", + " spans = []\n", + " _tree2spans(tree, spans, labeled=labeled, headed=headed)\n", + " # TODO\n", + " #try:\n", + " # assert(len(spans) == len(set(spans)))\n", + " #except:\n", + " # show_tree(tree)\n", + " # (display(spans))\n", + " # 1/0\n", + " return set(spans)" + ] + }, + { + "cell_type": "code", + "execution_count": 52, + "id": "65d493ca", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "<module 'neural_parser.hybrid_tree_utils' from '/home/kkrasnowska/neural-parsing/ICCS/neural_parser/hybrid_tree_utils.py'>" + ] + }, + "execution_count": 52, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from sklearn.metrics import precision_score, recall_score, f1_score, accuracy_score\n", + "\n", + "importlib.reload(hybrid_tree_utils)" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "id": "e5f88e76", + "metadata": { + "scrolled": false + }, + "outputs": [], + "source": [ + "ROOT = 'ROOT'\n", + "\n", + "def evaluate(tokens, tags_true, tags_pred, tags_combo, labeled=True, headed=False):\n", + "\n", + " P, R = [0, 0], [0, 0]\n", + " accuracies = {\n", + " key : {'true' : [], 'pred' : []} for key in ('heads', ('heads', 'deprels'))\n", + " }\n", + "\n", + " k = 0\n", + " i = 0\n", + " PROBLEM_TREES = []\n", + "\n", + " for toks, true, pred, combo in zip(tokens, tags_true, tags_pred, tags_combo):\n", + " \n", + " #sent = ' '.join(toks)\n", + " #cats = HDR\n", + " #true = dict(zip(cats, zip(*true)))\n", + " #pred = dict(zip(cats, zip(*pred)))\n", + " #print('----------------------------')\n", + " #print(sent)\n", + " dummy = {'lemmas' : ['_' for _ in toks], 'tags' : ['_' for _ in toks]}\n", + " true.update(dummy)\n", + " pred.update(dummy)\n", + " pred.update(combo)\n", + " try:\n", + " tree_true = hybrid_tree_utils.make_tree(toks, true, ROOT, decompress=True)\n", + " 
except:\n", + " print(toks)\n", + " display(true)\n", + " raise\n", + " try:\n", + " tree_pred = hybrid_tree_utils.make_tree(toks, pred, ROOT, decompress=True)\n", + " except:\n", + " print(toks)\n", + " display(pred)\n", + " print('=============================')\n", + " raise\n", + " tree_pred, problems = None, None\n", + " #if 'reattach' in problems:\n", + " # show_tree(tree_pred)\n", + " \n", + " #if pred['lemmas_corr'] != pred['lemmas']:\n", + " # print(pred['lemmas_corr'])\n", + " # print(pred['lemmas'])\n", + " \n", + " for key, v in accuracies.items():\n", + " if type(key) == str:\n", + " v['pred'] += [-1 if p is None else p for p in pred[key]]\n", + " v['true'] += [-1 if k is None else k for k in true[key]]\n", + " else:\n", + " v['pred'] += ['#'.join(map(str, x)) for x in zip(*(pred[kk] for kk in key))]\n", + " v['true'] += ['#'.join(map(str, x)) for x in zip(*(true[kk] for kk in key))]\n", + " \n", + " spans_true = tree2spans(tree_true, labeled=labeled, headed=headed)\n", + " spans_pred = tree2spans(tree_pred, labeled=labeled, headed=headed) if tree_pred else set()\n", + " if 'adwokata' in toks:\n", + " print(spans_true)\n", + " print(spans_pred)\n", + " tp = len(spans_true.intersection(spans_pred))\n", + " P[0] += tp\n", + " R[0] += tp\n", + " P[1] += len(spans_pred)\n", + " R[1] += len(spans_true)\n", + " leafs = tree_true.get_yield()\n", + " discont = [leaf.from_index for leaf in leafs] != list(range(len(leafs)))\n", + " #if k < 5 and len(toks) > 9 and [leaf.features['index'] for leaf in leafs] != list(range(len(leafs))):\n", + " #if k < 5 and spans_combo != spans_true:\n", + " #if k < 5 and not OK:\n", + " #if discont and len(toks) > 12 and k < 0 and spans_pred == spans_true:\n", + " if len(toks) == 8 and k < 0:\n", + " print('GOLD TREE:')\n", + " show_tree(tree_true)\n", + " display(true)\n", + " #display(_tree2dict(tree_true))\n", + " print('PREDICTED TREE:')\n", + " show_tree(tree_pred)\n", + " display(pred)\n", + " print('FP:', spans_pred - 
spans_true)\n", + " print('FN:', spans_true - spans_pred)\n", + " k += 1\n", + " i += 1\n", + " \n", + " p, r = P[0]/P[1], R[0]/R[1]\n", + " return {\n", + " 'P' : p, 'R': r, 'F1': (2 * p * r) / (p + r),\n", + " 'UAS' : accuracy_score(accuracies['heads']['true'], accuracies['heads']['pred']),\n", + " 'LAS' : accuracy_score(accuracies[('heads', 'deprels')]['true'], accuracies[('heads', 'deprels')]['pred']),\n", + " }" + ] + }, + { + "cell_type": "markdown", + "id": "df6a06fb", + "metadata": {}, + "source": [ + "0.9630140404796617\n", + "0.9605916493076027\n", + "0.9618013196384767\n", + "\n", + "– stare liczenie, bez kompresji, z tagami" + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "id": "8f8a771a", + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "unlabeled{((3,), 'SPAN', False), ((2, 3), 'SPAN', False), ((4,), 'SPAN', False), ((0, 1, 2, 3, 4), 'SPAN', False), ((0, 1, 2, 3), 'SPAN', False), ((2,), 'SPAN', False), ((0, 1), 'SPAN', False)}\n", + "{((3,), 'SPAN', False), ((2, 3), 'SPAN', False), ((4,), 'SPAN', False), ((0, 1, 2, 3, 4), 'SPAN', False), ((0, 1, 2, 3), 'SPAN', False), ((2,), 'SPAN', False), ((0, 1), 'SPAN', False)}\n", + "non-headed{((2,), 'Prep', False), ((4,), 'Punct', False), ((2, 3), 'PrepNP', False), ((3,), 'N', False), ((0, 1, 2, 3), 'S', False), ((0, 1), 'VP', False), ((0, 1), 'V', False), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False)}\n", + "{((2,), 'Prep', False), ((4,), 'Punct', False), ((2, 3), 'PrepNP', False), ((3,), 'N', False), ((0, 1, 2, 3), 'S', False), ((0, 1), 'VP', False), ((0, 1), 'V', False), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False)}\n", + "headed{((0, 1, 2, 3), 'S', True), ((4,), 'Punct', False), ((0, 1), 'VP', True), ((2, 3), 'PrepNP', False), ((0, 1), 'V', True), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False), ((2,), 'Prep', True), ((3,), 'N', True)}\n", + "{((0, 1, 2, 3), 'S', True), ((4,), 'Punct', False), ((0, 
1), 'VP', True), ((2, 3), 'PrepNP', False), ((0, 1), 'V', True), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False), ((2,), 'Prep', True), ((3,), 'N', True)}\n" + ] + } + ], + "source": [ + "EVAL_DATA = {\n", + " '1val' : (TOKENS_VAL, TAGS_VAL, TAGS_P_VAL, TAGS_C_VAL),\n", + " '2test' : (TOKENS_TEST, TAGS_TEST, TAGS_P_TEST, TAGS_C_TEST),\n", + "}\n", + "EVAL_MODES = {\n", + " '1unlabeled' : {'labeled' : False, 'headed' : False},\n", + " '2non-headed' : {'labeled' : True, 'headed' : False},\n", + " '3headed' : {'labeled' : True, 'headed' : True},\n", + "}\n", + "\n", + "METRICS = ('P', 'R', 'F1')\n", + "\n", + "RESULTS = []\n", + "\n", + "tex = []\n", + "tex.append('\\\\toprule\\n')\n", + "tex.append('& \\\\multicolumn{3}{c}{validation} & \\\\multicolumn{3}{c}{test} \\\\\\\\\\n')\n", + "tex.append('& precision & recall & F1 & precision & recall & F1 \\\\\\\\\\n')\n", + "tex.append('\\\\midrule\\n')\n", + "for mode_name, mode in sorted(EVAL_MODES.items()):\n", + " print(mode_name[1:], end='')\n", + " tex.append(mode_name)\n", + " for data_name, data in sorted(EVAL_DATA.items()):\n", + " evaluation = evaluate(*data, **mode)\n", + " for metric in METRICS:\n", + " tex.append(f' & {100 * evaluation[metric]:.2f}\\\\%')\n", + " RESULTS.append((data_name, mode_name, metric, evaluation[metric]))\n", + " tex.append(' \\\\\\\\\\n')\n", + "tex.append('\\\\bottomrule\\n')" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "63192852", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "78250b1b", + "metadata": {}, + "outputs": [], + "source": [ + "rows = set((r[0][1:], r[1][1:] if r[2] in ('P', 'R', 'F1') else '-', r[2], r[3]) for r in RESULTS)" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "id": "bba6ed15", + "metadata": {}, + "outputs": [], + "source": [ + "results = pd.DataFrame(data=rows, columns=['dataset', 'measure_type', 'measure', 'value'])" + 
] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "543377f8", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<style scoped>\n", + " .dataframe tbody tr th:only-of-type {\n", + " vertical-align: middle;\n", + " }\n", + "\n", + " .dataframe tbody tr th {\n", + " vertical-align: top;\n", + " }\n", + "\n", + " .dataframe thead th {\n", + " text-align: right;\n", + " }\n", + "</style>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th>dataset</th>\n", + " <th>measure_type</th>\n", + " <th>measure</th>\n", + " <th>value</th>\n", + " </tr>\n", + " <tr>\n", + " <th>dataset</th>\n", + " <th>measure</th>\n", + " <th>measure_type</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"9\" valign=\"top\">test</th>\n", + " <th rowspan=\"3\" valign=\"top\">F1</th>\n", + " <th>headed</th>\n", + " <th>7</th>\n", + " <td>test</td>\n", + " <td>headed</td>\n", + " <td>F1</td>\n", + " <td>0.959192</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>8</th>\n", + " <td>test</td>\n", + " <td>non-headed</td>\n", + " <td>F1</td>\n", + " <td>0.965236</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " <th>15</th>\n", + " <td>test</td>\n", + " <td>unlabeled</td>\n", + " <td>F1</td>\n", + " <td>0.964436</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">P</th>\n", + " <th>headed</th>\n", + " <th>9</th>\n", + " <td>test</td>\n", + " <td>headed</td>\n", + " <td>P</td>\n", + " <td>0.959611</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>6</th>\n", + " <td>test</td>\n", + " <td>non-headed</td>\n", + " <td>P</td>\n", + " <td>0.965658</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " 
<th>13</th>\n", + " <td>test</td>\n", + " <td>unlabeled</td>\n", + " <td>P</td>\n", + " <td>0.964118</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">R</th>\n", + " <th>headed</th>\n", + " <th>2</th>\n", + " <td>test</td>\n", + " <td>headed</td>\n", + " <td>R</td>\n", + " <td>0.958773</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>5</th>\n", + " <td>test</td>\n", + " <td>non-headed</td>\n", + " <td>R</td>\n", + " <td>0.964815</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " <th>0</th>\n", + " <td>test</td>\n", + " <td>unlabeled</td>\n", + " <td>R</td>\n", + " <td>0.964754</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"9\" valign=\"top\">val</th>\n", + " <th rowspan=\"3\" valign=\"top\">F1</th>\n", + " <th>headed</th>\n", + " <th>14</th>\n", + " <td>val</td>\n", + " <td>headed</td>\n", + " <td>F1</td>\n", + " <td>0.957423</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>4</th>\n", + " <td>val</td>\n", + " <td>non-headed</td>\n", + " <td>F1</td>\n", + " <td>0.963231</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " <th>1</th>\n", + " <td>val</td>\n", + " <td>unlabeled</td>\n", + " <td>F1</td>\n", + " <td>0.962553</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">P</th>\n", + " <th>headed</th>\n", + " <th>10</th>\n", + " <td>val</td>\n", + " <td>headed</td>\n", + " <td>P</td>\n", + " <td>0.958145</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>16</th>\n", + " <td>val</td>\n", + " <td>non-headed</td>\n", + " <td>P</td>\n", + " <td>0.963958</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " <th>11</th>\n", + " <td>val</td>\n", + " <td>unlabeled</td>\n", + " <td>P</td>\n", + " <td>0.962762</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">R</th>\n", + " <th>headed</th>\n", + " <th>17</th>\n", + " <td>val</td>\n", + " <td>headed</td>\n", + " <td>R</td>\n", + " 
<td>0.956702</td>\n", + " </tr>\n", + " <tr>\n", + " <th>non-headed</th>\n", + " <th>12</th>\n", + " <td>val</td>\n", + " <td>non-headed</td>\n", + " <td>R</td>\n", + " <td>0.962505</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unlabeled</th>\n", + " <th>3</th>\n", + " <td>val</td>\n", + " <td>unlabeled</td>\n", + " <td>R</td>\n", + " <td>0.962343</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " dataset measure_type measure value\n", + "dataset measure measure_type \n", + "test F1 headed 7 test headed F1 0.959192\n", + " non-headed 8 test non-headed F1 0.965236\n", + " unlabeled 15 test unlabeled F1 0.964436\n", + " P headed 9 test headed P 0.959611\n", + " non-headed 6 test non-headed P 0.965658\n", + " unlabeled 13 test unlabeled P 0.964118\n", + " R headed 2 test headed R 0.958773\n", + " non-headed 5 test non-headed R 0.964815\n", + " unlabeled 0 test unlabeled R 0.964754\n", + "val F1 headed 14 val headed F1 0.957423\n", + " non-headed 4 val non-headed F1 0.963231\n", + " unlabeled 1 val unlabeled F1 0.962553\n", + " P headed 10 val headed P 0.958145\n", + " non-headed 16 val non-headed P 0.963958\n", + " unlabeled 11 val unlabeled P 0.962762\n", + " R headed 17 val headed R 0.956702\n", + " non-headed 12 val non-headed R 0.962505\n", + " unlabeled 3 val unlabeled R 0.962343" + ] + }, + "execution_count": 58, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results.groupby(['dataset', 'measure', 'measure_type'], group_keys=True).apply(lambda x: x)" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "id": "0b5d3fe4", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\\toprule\n", + "& \\multicolumn{3}{c}{validation} & \\multicolumn{3}{c}{test} \\\\\n", + "& precision & recall & F1 & precision & recall & F1 \\\\\n", + "\\midrule\n", + "1unlabeled & 96.28\\% & 96.23\\% & 96.26\\% & 96.41\\% & 96.48\\% & 96.44\\% \\\\\n", + 
"2non-headed & 96.40\\% & 96.25\\% & 96.32\\% & 96.57\\% & 96.48\\% & 96.52\\% \\\\\n", + "3headed & 95.81\\% & 95.67\\% & 95.74\\% & 95.96\\% & 95.88\\% & 95.92\\% \\\\\n", + "\\bottomrule\n" + ] + } + ], + "source": [ + "for t in tex:\n", + " print(t, end='')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7946f27c", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3ff86ee7", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "378cc977", + "metadata": {}, + "outputs": [], + "source": [ + "def evaluate_spines(tags_true, tags_pred):\n", + "\n", + " TRUE, PRED = [], []\n", + " values = set()\n", + "\n", + " for true, pred in zip(tags_true, tags_pred):\n", + " t, p = true['spines'], pred['spines']\n", + " TRUE += t\n", + " PRED += p\n", + " values.update(t + p)\n", + " \n", + " print('ACCURACY:', accuracy_score(TRUE, PRED))\n", + " \n", + " values = sorted(values)\n", + " ct = Counter(TRUE)\n", + " cp = Counter(PRED)\n", + " precisions = precision_score(TRUE, PRED, average=None)\n", + " recalls = recall_score(TRUE, PRED, average=None)\n", + " f1s = f1_score(TRUE, PRED, average=None)\n", + " #for v, p, r, f in sorted(zip(values, precisions, recalls, f1s), key=lambda x: -x[3]):\n", + " # if v.endswith('formarzecz') or v.endswith('formaczas'):\n", + " # spine = ' $\\\\rightarrow$ '.join(f'\\\\nt{{{n}}}' for n in v.split('_'))\n", + " # print(f'{spine} & {100 * p:.2f}\\\\% & {100 * r:.2f}\\\\% & {100 * f:.2f}\\\\% \\\\\\\\')\n", + " \n", + " ct_pre, cp_pre = Counter(), Counter()\n", + " for val in values:\n", + " pre = val.split('_')[-1]\n", + " ct_pre[pre] += ct[val]\n", + " cp_pre[pre] += cp[val]\n", + " \n", + " rows = []\n", + " \n", + " for pre in ct_pre.keys():\n", + " # TODO\n", + " if pre == 'ign':\n", + " continue\n", + " if not cp_pre[pre] * ct_pre[pre]:\n", + " print('SKIPPING:', pre)\n", + " 
continue\n", + " P, R = 0, 0\n", + " rws = []\n", + " for v, p, r, f in sorted(zip(values, precisions, recalls, f1s), key=lambda x: -x[3]):\n", + " if v.endswith(pre):\n", + " if pre in ('N', 'V',):\n", + " spine = ' $\\\\rightarrow$ '.join(f'\\\\nt{{{n}}}' for n in v.split('_'))\n", + " rws.append(f'{spine} & {100 * p:.2f}\\\\% & {100 * r:.2f}\\\\% & {100 * f:.2f}\\\\% & {ct[v]} \\\\\\\\')\n", + " wp, wr = cp[v] / cp_pre[pre], ct[v] / ct_pre[pre]\n", + " #print(f' {v:36s} {100 * p:6.2f} {wp:7.3f} {100 * r:6.2f} {wr:7.3f}')\n", + " P += p * wp\n", + " R += r * wr\n", + " F = 2 * P * R / (P + R)\n", + " if pre in ('N', 'V',):\n", + " rws.append('\\\\midrule')\n", + " spine = f'... $\\\\rightarrow$ \\\\nt{{{pre}}}'\n", + " rws = [f'{spine} & {100 * P:6.2f}\\\\% & {100 * R:6.2f}\\\\% & {100 * F:6.2f}\\\\% & {ct_pre[pre]} \\\\\\\\', '\\\\midrule'] + rws\n", + " rows.append([-F, rws])\n", + " \n", + " for _, rws in sorted(rows):\n", + " for r in rws:\n", + " print(r)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "79a535ee", + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "evaluate_spines(TAGS_VAL, TAGS_P_VAL)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ff572777", + "metadata": {}, + "outputs": [], + "source": [ + "evaluate_spines(TAGS_TEST, TAGS_P_TEST)" + ] + }, + { + "cell_type": "markdown", + "id": "a7784f94", + "metadata": {}, + "source": [ + "pdbc_hybrid2: cały path (łącznie z powtórzeniamia )+ który <anchor> od dołu:\n", + "\n", + "P: 0.9554150435214833\n", + "R: 0.952102292362631\n", + "F1: 0.9537557913442842" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "TF_zajecia", + "language": "python", + "name": "tf_zajecia" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.6" 
+ } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git b/neural_parser/MultiTarget.py a/neural_parser/MultiTarget.py new file mode 100644 index 0000000..79d7553 --- /dev/null +++ a/neural_parser/MultiTarget.py @@ -0,0 +1,89 @@ +import tensorflow as tf + +from transformers import TFBertPreTrainedModel, BertConfig, TFBertMainLayer +from transformers.modeling_tf_utils import get_initializer, input_processing, TFTokenClassificationLoss + +class TFBertForMultiTargetTokenClassification(TFBertPreTrainedModel, TFTokenClassificationLoss): + # names with a '.' represents the authorized unexpected/missing layers when a TF model is loaded from a PT model + _keys_to_ignore_on_load_unexpected = [ + r"pooler", + r"mlm___cls", + r"nsp___cls", + r"cls.predictions", + r"cls.seq_relationship", + ] + _keys_to_ignore_on_load_missing = [r"dropout"] + + def __init__(self, config: BertConfig, *inputs, **kwargs): + + categories = kwargs.pop('categories') + labels = kwargs.pop('labels') + + super().__init__(config, *inputs, **kwargs) + + self.categories = categories + + self.bert = TFBertMainLayer(config, add_pooling_layer=False, name="bert") + classifier_dropout = ( + config.classifier_dropout if config.classifier_dropout is not None else config.hidden_dropout_prob + ) + self.dropout = tf.keras.layers.Dropout(rate=classifier_dropout) + self.classifiers = [ + tf.keras.layers.Dense( + units=len(labels[cat]), + kernel_initializer=get_initializer(config.initializer_range), + name=f'classifier_{cat}', + ) for cat in self.categories + ] + print(f'created {len(self.classifiers)} classifier(s)') + + def call( + self, + input_ids=None, + attention_mask=None, + token_type_ids=None, + position_ids=None, + head_mask=None, + inputs_embeds=None, + output_attentions=None, + output_hidden_states=None, + return_dict=None, + labels=None, + training=False, + **kwargs, + ): + inputs = input_processing( + func=self.call, + config=self.config, + input_ids=input_ids, + attention_mask=attention_mask, + 
token_type_ids=token_type_ids, + position_ids=position_ids, + head_mask=head_mask, + inputs_embeds=inputs_embeds, + output_attentions=output_attentions, + output_hidden_states=output_hidden_states, + return_dict=return_dict, + labels=labels, + training=training, + kwargs_call=kwargs, + ) + outputs = self.bert( + input_ids=inputs["input_ids"], + attention_mask=inputs["attention_mask"], + token_type_ids=inputs["token_type_ids"], + position_ids=inputs["position_ids"], + head_mask=inputs["head_mask"], + inputs_embeds=inputs["inputs_embeds"], + output_attentions=inputs["output_attentions"], + output_hidden_states=inputs["output_hidden_states"], + return_dict=inputs["return_dict"], + training=inputs["training"], + ) + sequence_output = outputs[0] + sequence_output = self.dropout(inputs=sequence_output, training=inputs["training"]) + logits = [classifier(inputs=sequence_output) for classifier in self.classifiers] + return dict(zip(self.categories, logits)) + + def serving_output(self, output): + return output diff --git b/neural_parser/constants.py a/neural_parser/constants.py new file mode 100644 index 0000000..a4ab88d --- /dev/null +++ a/neural_parser/constants.py @@ -0,0 +1,15 @@ +MASK_VALUE = -100 + +FIRST = 'first' +LAST = 'last' + +EMPTY = '<EMPTY>' + +TOKENS = 'tokens' +LEMMAS = 'lemmas' +TAGS = 'tags' +SPINES = 'spines' +ANCHORS = 'anchors' +ANCHOR_HS = 'anchor_hs' +HEADS = 'heads' +DEPRELS = 'deprels' diff --git b/neural_parser/constituency_parser.py a/neural_parser/constituency_parser.py new file mode 100644 index 0000000..a73efe4 --- /dev/null +++ a/neural_parser/constituency_parser.py @@ -0,0 +1,139 @@ +import json + +import morfeusz2 + +import tensorflow as tf +from transformers import AutoTokenizer + +from datasets.features import ClassLabel, Sequence + +from .data_utils import dict_to_tensors +from .dataset_utils import masked_word_ids +from .MultiTarget import TFBertForMultiTargetTokenClassification + +from .constants import ( + SPINES, + ANCHORS, + 
def maybe_int(s):
    """Return ``s`` as an ``int`` if it is a plain decimal literal, else unchanged.

    Accepts an optional leading ``-`` followed by decimal digits.  The check
    uses ``str.isdecimal()`` rather than ``str.isdigit()``: ``isdigit()`` is
    also true for characters such as ``'²'`` that ``int()`` cannot parse,
    which made the original raise ``ValueError`` on such keys.
    """
    if not s:
        return s
    digits = s[1:] if s[0] == '-' else s
    if digits.isdecimal():
        return int(s)
    return s


def keys_hook(d):
    """``json.load`` object hook: convert integer-looking keys of ``d`` to ``int``."""
    return {maybe_int(k): v for k, v in d.items()}


def get_labels(features, categories):
    """Collect the label names of every ``ClassLabel`` sequence feature.

    Returns a dict mapping each category in ``categories`` whose inner
    feature is a ``ClassLabel`` to that feature's ``names``; other
    categories are left out.
    """
    labels = {}
    for cat in categories:
        feature = features[cat].feature
        if isinstance(feature, ClassLabel):
            labels[cat] = feature.names
    return labels


class ConstituencyParser(object):
    """Wraps a multi-target BERT token classifier predicting spines and anchors."""

    def __init__(
        self,
        bert_path,
        model,
        labels,
        bert_tokenizer=None,
    ):
        """Store the model and labels; load a tokenizer from ``bert_path`` if none is given."""
        self.bert_path = bert_path
        self.model = model
        self.categories = [SPINES, ANCHORS, ANCHOR_HS]
        self.labels = labels
        if bert_tokenizer is not None:
            self.bert_tokenizer = bert_tokenizer
        else:
            self.bert_tokenizer = AutoTokenizer.from_pretrained(bert_path)
        self.morfeusz = morfeusz2.Morfeusz(generate=False, expand_tags=True)

    def save(self, path):
        """Save the model to ``{path}/model`` and labels + BERT path to ``{path}/config.json``."""
        self.model.save_pretrained(f'{path}/model')
        config = {
            'labels' : self.labels,
            'bert_path' : self.bert_path,
        }
        # ensure_ascii=False emits raw non-ASCII characters, so the encoding
        # must be pinned instead of depending on the platform locale.
        with open(f'{path}/config.json', 'w', encoding='utf-8') as f:
            json.dump(config, f, ensure_ascii=False)

    @staticmethod
    def create(
        bert_path,
        features,
        bert_tokenizer=None,
    ):
        """Build a fresh parser from a pretrained (PyTorch) BERT checkpoint.

        The label inventory is read from the dataset ``features``.
        """
        categories = [SPINES, ANCHORS, ANCHOR_HS]
        labels = get_labels(features, categories)
        model = TFBertForMultiTargetTokenClassification.from_pretrained(
            bert_path,
            from_pt=True,
            categories=categories,
            labels=labels,
        )
        return ConstituencyParser(
            bert_path,
            model,
            labels,
            bert_tokenizer=bert_tokenizer
        )

    @staticmethod
    def load(path):
        """Restore a parser previously written by :meth:`save`."""
        with open(f'{path}/config.json', encoding='utf-8') as f:
            config = json.load(f, object_hook=keys_hook)
        labels = config['labels']
        bert_path = config['bert_path']
        categories = [SPINES, ANCHORS, ANCHOR_HS]
        model = TFBertForMultiTargetTokenClassification.from_pretrained(
            f'{path}/model',
            categories=categories,
            labels=labels,
        )
        return ConstituencyParser(
            bert_path,
            model,
            labels,
        )

    def align_with_mask(self, labels, mask):
        """Keep only the entries of ``labels`` whose ``mask`` entry is not ``None``.

        Non-string iterable entries are filtered recursively with the same mask.
        """
        return [
            lbl if not hasattr(lbl, '__iter__') or isinstance(lbl, str) else self.align_with_mask(lbl, mask)
            for lbl, m in zip(labels, mask) if m is not None
        ]

    def parse(self, sentences, force_long=False):
        """Predict spine/anchor labels for whitespace-tokenized sentences.

        ``sentences`` is a single string or an iterable of strings.  Returns
        a list with one ``(tokens, labels)`` pair per sentence, where
        ``labels`` maps each predicted category to its per-token label list.

        Raises ``RuntimeError`` when the padded sub-token sequence exceeds
        the tokenizer's ``model_max_length`` and ``force_long`` is false.
        """
        if isinstance(sentences, str):
            sentences = [sentences]
        # Materialise once: everything below works from ``tokens`` so a
        # one-shot iterator of sentences is handled correctly.
        tokens = [s.split() for s in sentences]
        if not tokens:
            return []
        tokenized = self.bert_tokenizer(
            tokens,
            is_split_into_words=True,
            return_offsets_mapping=True,
            padding=True,
        )

        M = len(tokenized['input_ids'][0])
        if M > self.bert_tokenizer.model_max_length and not force_long:
            raise RuntimeError(f'Bert tokenizer produced a sequence of {M} tokens which exceeds the model’s limit ({self.bert_tokenizer.model_max_length}). Parse shorter sentences or call parse with force_long=True at your own risk.')
        x = dict_to_tensors(dict(tokenized))

        predicted = self.model.predict(x)
        labels = dict()
        for cat, pred in predicted.items():
            label_ids = tf.argmax(pred, axis=-1).numpy()
            labels[cat] = [[self.labels[cat][i] for i in l_ids] for l_ids in label_ids]

        trees = []

        for i, tkns in enumerate(tokens):
            # One label per word: drop special tokens and non-selected sub-tokens.
            mask = masked_word_ids(tokenized.word_ids(i))
            aligned = {cat : self.align_with_mask(cat_lbls[i], mask) for cat, cat_lbls in labels.items()}
            trees.append((tkns, aligned))

        return trees
len(labels)) + else: + return [MASK_VALUE] * (sequence_length - len(labels)) + list(labels) + + def __call__(self, instance): + + batch = self.tokenizer.pad( + instance, + padding=True, + ) + sequence_length = tf.convert_to_tensor(batch['input_ids']).shape[1] + for category, feat in self.features.items(): + if type(feat.feature) == ClassLabel: + padded_labels = [self._pad_labels(lbl, sequence_length) for lbl in batch[category]] + batch[category] = padded_labels + else: + raise ValueError(f'Unsupported feature type {type(feat.feature)} for "{category}".') + batch = {k: tf.convert_to_tensor(v) for k, v in batch.items()} + return batch + +def dict_to_tensors(d): + return { k : tf.convert_to_tensor(v) for k, v in d.items() } diff --git b/neural_parser/dataset_utils.py a/neural_parser/dataset_utils.py new file mode 100644 index 0000000..8917060 --- /dev/null +++ a/neural_parser/dataset_utils.py @@ -0,0 +1,138 @@ +from collections import Counter, defaultdict +from itertools import chain + +from datasets import ClassLabel, Sequence + +from .hybrid_tree_utils import tree_from_dataset_instance + +from .constants import ( + FIRST, + LAST, + MASK_VALUE, + EMPTY, + TOKENS, + SPINES, + ANCHORS, + ANCHOR_HS, +) + +def _do_collect_spines(tree): + if not tree.children: + return [tree], [] + heads = [child for child in tree.children if child.is_head] + assert(len(heads) == 1) + head = heads[0] + paths = [] + my_path = [tree] + non_heads = [] + for child in tree.children: + child_path, grandchildren_paths = _do_collect_spines(child) + paths += grandchildren_paths + if child == head: + my_path += child_path + else: + non_heads.append(child_path) + for child_path in non_heads: + # h == which <tree.category> counting from the bottom is the anchor + h = [n.category for n in my_path].count(tree.category) + paths.append((tree.category, h, child_path)) + return my_path, paths + +def _collect_spines(tree): + try: + path, paths = _do_collect_spines(tree) + except: + print(tree.to_brackets()) 
+ raise + return {p[-1] : (anchor, h, p[:-1]) for anchor, h, p in [('<ROOT>', '<ROOT>', path)] + paths} + +def _compress_spine(spine): + compressed = [] + for category in spine: + if category in compressed: + assert(category == compressed[-1]) + else: + compressed.append(category) + return compressed + +def _add_spines_and_attachments(instance, dataset_features, compress): + tree = tree_from_dataset_instance(instance, dataset_features) + spines = _collect_spines(tree) + leafs_linear = sorted(tree.get_yield(), key=lambda leaf: leaf.from_index) + rows = [] + for leaf in leafs_linear: + anchor, anchor_h, spine = spines[leaf] + spine = [node.category for node in spine] + if compress: + spine = _compress_spine(spine) + spine = '_'.join(spine) if spine else EMPTY + rows.append((spine, anchor, str(anchor_h))) + spines, anchors, anchor_hs = zip(*rows) + return { + SPINES : spines, + ANCHORS : anchors, + ANCHOR_HS : anchor_hs, + } + +def cast_labels(dataset, columns): + vals = defaultdict(Counter) + for d in dataset.values(): + for column in columns: + vals[column].update(chain.from_iterable(s[column] for s in d)) + new_features = dataset['train'].features.copy() + for column in columns: + new_features[column] = Sequence(ClassLabel(names=sorted(vals[column].keys()))) + return dataset.cast(new_features) + +def add_spines_and_attachments(dataset, compress=False): + dataset_features = dataset['train'].features + new_dataset = dataset.map(lambda instance: _add_spines_and_attachments(instance, dataset_features, compress=compress)) + return cast_labels(new_dataset, [SPINES, ANCHORS, ANCHOR_HS]) + +# https://huggingface.co/docs/transformers/v4.23.1/en/tasks/token_classification + +def masked_word_ids(word_ids, masking_strategy=FIRST): + masked = [] + for i, word_idx in enumerate(word_ids): + # Set the label for the first/last token of each word. 
class TreeNode(object):
    """A node of a constituency tree with head marking.

    A node without children is a leaf.  ``to_brackets`` reads a leaf's
    ``category`` as an indexable record whose element 0 is the surface form
    and element 2 the morphological tag; for inner nodes ``category`` is
    used as a string label.
    """

    def __init__(self, nid, category, is_head, from_index, to_index, head_index=None, deprel=None, attributes=None, children=None):
        """Create a node and register it as the parent of *children*.

        ``attributes`` defaults to a fresh dict and ``children`` to a fresh
        list, so instances never share these containers.
        """
        self.nid = nid
        self.parent = None
        self.category = category
        self.is_head = is_head
        self.from_index = from_index
        self.to_index = to_index
        self.head_index = head_index
        self.deprel = deprel
        self.attributes = attributes if attributes is not None else {}
        self.children = children if children is not None else []
        for child in self.children:
            child.parent = self

    def add_child(self, child):
        """Append *child* to this node's children and set its parent link."""
        self.children.append(child)
        child.parent = self

    def get_yield(self):
        """Return the leaves below this node in child order (the node itself if it is a leaf)."""
        if not self.children:
            return [self]
        return list(chain.from_iterable(child.get_yield() for child in self.children))

    def is_continuous(self):
        """Return True if the leaves' ``from_index`` values are in non-decreasing order."""
        idx = [token.from_index for token in self.get_yield()]
        return (idx == sorted(idx))

    def get_root(self):
        """Follow parent links upwards and return the topmost node."""
        root = self
        while root.parent is not None:
            root = root.parent
        return root

    def get_head_child(self):
        """Return the single child flagged ``is_head``, or None for a leaf.

        Raises:
            AssertionError: if the node has children but not exactly one head.
        """
        if not self.children:
            return None
        heads = [child for child in self.children if child.is_head]
        if len(heads) != 1:
            # Explicit raise so the check is kept under `python -O`.
            raise AssertionError(
                f'expected exactly one head child, found {len(heads)}')
        return heads[0]

    def get_head_token(self):
        """Descend through head children and return the leaf that is reached."""
        node = self
        while node.children:
            node = node.get_head_child()
        return node

    def make_evalb_friendly(self, s):
        """Return *s* with spaces replaced by ``_`` and parentheses by ``LPAR``/``RPAR``."""
        return s.replace(' ', '_').replace('(', 'LPAR').replace(')', 'RPAR')

    def to_brackets(self, features=(), mark_head=True, mark_head_terminals=False, morph_tags=False, dummy_pre=False):
        """Render the subtree as a bracketed string.

        Args:
            features: attribute names whose values are appended (joined with
                ``_``) to every inner node label; a missing attribute
                contributes ``EMPTY``.
            mark_head: prefix labels of inner head nodes with ``*``.
            mark_head_terminals: not supported.
            morph_tags: wrap every leaf as ``(<tag> <form>)``.
            dummy_pre: wrap a leaf in ``(DUMMY_PRE ...)`` when it has siblings.

        Raises:
            NotImplementedError: if *mark_head_terminals* is true.
        """
        if mark_head_terminals:
            raise NotImplementedError
        if not self.children:
            cat = self.make_evalb_friendly(self.category[0])
            if morph_tags:
                cat = f'({self.category[2]} {cat})'
            # A leaf without a parent has no siblings, so it is treated like
            # an only child instead of failing on `self.parent.children`.
            only_child = self.parent is None or len(self.parent.children) == 1
            if only_child or not dummy_pre:
                return cat
            return f'(DUMMY_PRE {cat})'
        cat = '_'.join([self.category] + [self.attributes.get(f, EMPTY) for f in features])
        if mark_head and self.is_head:
            cat = '*' + cat
        cat = self.make_evalb_friendly(cat)
        rendered_children = ' '.join(
            child.to_brackets(
                features=features,
                mark_head=mark_head,
                mark_head_terminals=mark_head_terminals,
                morph_tags=morph_tags,
                dummy_pre=dummy_pre,
            )
            for child in self.children
        )
        return f'({cat} {rendered_children})'

    def pretty_print(self, tab='', features=()):
        """Print the subtree, one node per line, indenting each level by one more *tab* step.

        Each line shows the node id, a ``*`` for head nodes, the category and
        the list of values of the requested *features* (``EMPTY`` if missing).
        """
        print(f'{tab}[{self.nid}] {"*" if self.is_head else ""}{self.category}{[self.attributes.get(f, EMPTY) for f in features]}')
        for child in self.children:
            child.pretty_print(tab=tab + ' ', features=features)
def append_dependent(head_path, dep_path, anchor_cat, anchor_h, decompress=False):
    """Attach *dep_path* to a node on the head chain of *head_path*.

    The head chain is *head_path* followed by successive head children down
    to a leaf.  Among the chain nodes whose category equals *anchor_cat*,
    the one that is *anchor_h*-th counting from the bottom becomes the
    parent of *dep_path*.

    Args:
        head_path: root node of the tree to attach to.
        dep_path: root node of the subtree being attached; its ``is_head``
            flag is cleared.
        anchor_cat: category of the node to attach under.
        anchor_h: 1-based position, counted from the bottom, among chain
            nodes with category *anchor_cat*; ``None`` selects the highest.
        decompress: when *anchor_h* exceeds the number of matching nodes,
            insert additional *anchor_cat* nodes above the highest match
            instead of clamping *anchor_h* to the highest match.

    Returns:
        ``(head_path, problem)``.  ``head_path`` is the (possibly new) root
        of the head tree.  ``problem`` is ``None`` on success, or
        ``(dep_path, anchor_cat)`` when no chain node has category
        *anchor_cat*; in that case *dep_path* is attached directly under
        *head_path*.

    Raises:
        AssertionError: if a node on the chain does not have exactly one
            head child; both the whole tree and the offending node are
            printed first.
    """
    problem = None

    # Walk down the head children, collecting the head chain top-down.
    head_chain = [head_path]
    while head_chain[-1].children:
        current = head_chain[-1]
        heads = [child for child in current.children if child.is_head]
        if len(heads) != 1:
            # Dump diagnostics, then fail.  Raised explicitly so the check is
            # not stripped under `python -O` and no bare `except:` is needed.
            head_path.pretty_print()
            current.pretty_print()
            raise AssertionError(
                f'expected exactly one head child, found {len(heads)}')
        head_chain.append(heads[0])

    matching_heads = [hd for hd in head_chain if hd.category == anchor_cat]
    if not matching_heads:
        # No node of the requested category: attach at the top and report it.
        anchor_node = head_path
        problem = (dep_path, anchor_cat)
    else:
        if anchor_h is None:
            # fallback: take the highest
            anchor_h = len(matching_heads)
        elif anchor_h > len(matching_heads):
            if decompress:
                # Grow the chain: wrap the highest matching node in new
                # anchor_cat nodes until there are anchor_h of them.
                for _ in range(anchor_h - len(matching_heads)):
                    child = matching_heads[0]
                    # Remember the old parent: constructing new_node with
                    # children=[child] re-points child.parent at new_node.
                    parent = child.parent
                    new_node = TreeNode(0, anchor_cat, child.is_head, None, None, children=[child])
                    child.is_head = True
                    if parent is not None:
                        parent.children.remove(child)
                        parent.add_child(new_node)
                    if head_path is child:
                        head_path = new_node
                    matching_heads.insert(0, new_node)
            else:
                anchor_h = len(matching_heads)
        anchor_node = matching_heads[-anchor_h]

    anchor_node.add_child(dep_path)
    dep_path.is_head = False
    return head_path, problem
def check_no_cycles(heads):
    """Return True if the head assignment *heads* contains no cycle.

    ``heads[i]`` is the index of token ``i``'s head.  Any value that is not a
    valid index into *heads* (for example ``None`` or ``-1``) marks a token
    without a head inside the sentence and ends the chain.

    The previous breadth-first walk from ``-1`` could never report a cycle:
    every index belongs to exactly one children set, so a popped set could
    not intersect the visited set, and nodes unreachable from ``-1`` were
    never inspected.  This version follows the head pointers from every
    token instead.
    """
    n = len(heads)

    def _is_index(value):
        return value is not None and 0 <= value < n

    UNSEEN, ON_PATH, DONE = 0, 1, 2
    state = [UNSEEN] * n
    for start in range(n):
        path = []
        node = start
        while _is_index(node) and state[node] == UNSEEN:
            state[node] = ON_PATH
            path.append(node)
            node = heads[node]
        if _is_index(node) and state[node] == ON_PATH:
            # Walked back into the chain currently being followed.
            return False
        # The chain ended at a headless token or joined a chain already
        # known to be acyclic.
        for visited in path:
            state[visited] = DONE
    return True
assert(spines[i].startswith(root_label)) + spines[i] = EMPTY if spines[i] == root_label else spines[i].replace(f'{root_label}_', '') + + reattach = False + + new_heads = try_reattach(heads, spines, tokens) + if new_heads != heads: + heads = new_heads + reattach = True + + head_paths = [ + make_head_path(p, tok, lemma, tag, i) for i, (p, tok, lemma, tag) + in enumerate(zip(spines, tokens, lemmas, morph_tags)) + ] + + # if a spine is some other spine’s head and consists of a terminal only, add a dummy preterminal to append to + head_paths = [add_dummy_pre(hp) if (type(hp.category) == tuple and i in heads) else hp for i, hp in enumerate(head_paths)] + + anchor_hs = [int(h) if h != '<ROOT>' else None for h in anchor_hs] + root = None + for i, head in enumerate(heads): + if deprels[i] is not None: + head_paths[i].attributes['deprel'] = deprels[i] + if head is None: + root = i + else: + head_paths[head], problem = append_dependent( + head_paths[head], head_paths[i], anchors[i], anchor_hs[i], decompress=decompress) + if problem: + problems.append(problem) + if reattach: + problems.append('reattach') + + tree = _rearrange(head_paths[root]) + + return tree, problems + +def make_tree(tokens, tags, root_label, decompress=True): + tree, problems = reconstruct_tree(tokens, tags, decompress=decompress, root_label=root_label) + return tree + +def _node2dict(tree): + children = [_node2dict(child) for child in tree.children] + leaves = tree.get_yield() + node = { + 'is_head' : tree.is_head, + 'span' : {'from' : tree.from_index, 'to' : tree.to_index}, + } + if tree.deprel is not None: + node['deprel'] = tree.deprel + if tree.attributes: + node['attributes'] = tree.attributes + if children: + node.update({ + 'category' : tree.category, + 'children' : children, + }) + else: + node.update(dict(zip(('orth', 'base', 'tag'), tree.category))) + return node + +def tree2dict(tree, metadata={}): + return {'tree' : _node2dict(tree), 'metadata' : metadata} diff --git b/neural_parser/training.py 
class AvgAccuracy(tf.keras.callbacks.Callback):
    """Callback that adds averaged accuracy entries to the epoch logs.

    At the end of each epoch every log entry whose key ends in ``_acc`` is
    averaged: keys starting with ``val_`` go into ``val_avg_acc``, all
    others into ``avg_acc``.  The averages are written back into ``logs``.
    """

    def __init__(self):
        super(AvgAccuracy, self).__init__()

    def on_epoch_begin(self, epoch, logs=None):
        return

    def on_epoch_end(self, epoch, logs=None):
        if logs is None:
            # Nothing to read from and nowhere to publish the averages.
            return
        accs = []
        val_accs = []
        for k, v in logs.items():
            if k.endswith('_acc'):
                if k.startswith('val_'):
                    val_accs.append(v)
                else:
                    accs.append(v)
        # Only publish an average when there is something to average; an
        # empty group (e.g. no validation metrics in the logs) used to raise
        # ZeroDivisionError.
        if accs:
            logs['avg_acc'] = sum(accs) / len(accs)
        if val_accs:
            logs['val_avg_acc'] = sum(val_accs) / len(val_accs)
class Trainer(object):
    """Prepares a dataset for BERT and trains a ``ConstituencyParser`` on it.

    The labels to predict are the ``SPINES``, ``ANCHORS`` and ``ANCHOR_HS``
    columns of the dataset.
    """

    def __init__(
        self,
        bert_path,
        dataset,
        batch_size=32,
    ):
        """Load the tokenizer, tokenize the dataset and build the tf datasets.

        Args:
            bert_path: passed to ``AutoTokenizer.from_pretrained`` and later
                to ``ConstituencyParser.create``.
            dataset: mapping with at least ``'train'`` and ``'validation'``
                parts; the ``'train'`` part's ``features`` must contain the
                label columns.
            batch_size: batch size of the generated tf datasets.
        """
        self.bert_path = bert_path
        self.dataset = dataset
        self.masking_strategy = FIRST
        self.batch_size = batch_size

        self.categories = [SPINES, ANCHORS, ANCHOR_HS]

        self.features = Features({cat : self.dataset['train'].features[cat] for cat in self.categories})

        print('Loading BERT tokenizer...')
        self.bert_tokenizer = AutoTokenizer.from_pretrained(self.bert_path)

        print('Preprocessing the dataset for BERT...')
        self.dataset = self.dataset.map(lambda x: bert_tokenize_and_align(x, self.bert_tokenizer, self.masking_strategy))

        self.train_data = self._prepare_tf_data(self.dataset['train'], shuffle=True)
        self.dev_data = self._prepare_tf_data(self.dataset['validation'])

    def _prepare_tf_data(self, dataset, shuffle=False):
        """Convert *dataset* to a batched tf dataset, collating with ``DataCollator``."""
        collator = DataCollator(self.bert_tokenizer, self.features)
        return Dataset.to_tf_dataset(
            dataset,
            columns=['input_ids', 'token_type_ids', 'attention_mask'],
            label_cols=self.categories,
            batch_size=self.batch_size, shuffle=shuffle, collate_fn=collator
        )

    def _prepare_output_dir(self, path):
        """Make sure *path* is an existing, empty directory.

        A missing directory is created (including missing parents); an
        existing directory has all of its entries removed.

        Raises:
            ValueError: if *path* exists but is not a directory.
        """
        # Local import: the module's import block does not bring in shutil.
        import shutil

        # Filesystem calls replace the former `mkdir` / `rm -r` shell
        # strings, which broke on paths containing spaces or shell
        # metacharacters and ignored failures.
        if not os.path.exists(path):
            os.makedirs(path)
            return
        if not os.path.isdir(path):
            raise ValueError(f'{path} is not a directory')
        entries = os.listdir(path)
        if entries:
            print(f'emptying {path}')
            for entry in entries:
                entry_path = os.path.join(path, entry)
                if os.path.isdir(entry_path) and not os.path.islink(entry_path):
                    shutil.rmtree(entry_path)
                else:
                    os.remove(entry_path)

    def _make_callbacks(self, log_dir):
        """Return the training callbacks.

        Always: ``AvgAccuracy`` and early stopping on ``val_avg_acc``
        (patience 4, best weights restored).  A TensorBoard callback is added
        when *log_dir* is not ``None``.
        """
        callbacks = [
            AvgAccuracy(),
            tf.keras.callbacks.EarlyStopping(monitor='val_avg_acc', patience=4, verbose=1, restore_best_weights=True)
        ]
        if log_dir is not None:
            callbacks.append(tf.keras.callbacks.TensorBoard(log_dir=log_dir, histogram_freq=0, update_freq=50))
        return callbacks

    def train(self, epochs=10, lr=0.00001, log_dir=None, model_dir=None):
        """Create a parser, fit it on the training data and optionally save it.

        Args:
            epochs: maximum number of epochs passed to ``fit``.
            lr: learning rate of the Adam optimizer.
            log_dir: if given, the directory is created/emptied and used for
                TensorBoard logs.
            model_dir: if given, the directory is created/emptied, the parser
                is saved there and a ``trainer.info`` file with the run
                settings is written next to it.

        Returns:
            The trained parser.
        """
        if log_dir is not None:
            self._prepare_output_dir(log_dir)
        if model_dir is not None:
            self._prepare_output_dir(model_dir)

        parser = ConstituencyParser.create(
            self.bert_path,
            self.features,
            bert_tokenizer=self.bert_tokenizer
        )

        parser.model.config.tf_legacy_loss = True
        hf_loss = parser.model.hf_compute_loss

        def _loss(labels, logits):
            print('LABELS:', labels)
            print('LOGITS:', logits)
            l = hf_loss(labels, logits)
            print('LOSS:', l)
            return l

        # wrap in eager execution so that tensor values can be printed
        def debug_loss(y_true, y_pred):
            return tf.py_function(func=_loss, inp=[tf.cast(y_true, tf.float32), y_pred], Tout=tf.float32)

        # Debugging aid: assign `debug_loss` here instead to print labels,
        # logits and loss values during training.
        loss = hf_loss

        accuracy_metric = lambda: tf.keras.metrics.MeanMetricWrapper(
            fn=_masked_sparse_categorical_accuracy, name='acc'
        )

        metrics = {cat : [accuracy_metric()] for cat in self.categories}

        losses = {cat : loss for cat in self.categories}

        initial_epoch = 0

        parser.model.compile(
            optimizer=tf.keras.optimizers.Adam(learning_rate=lr),
            loss=losses,
            metrics=metrics
        )
        parser.model.fit(
            x=self.train_data,
            validation_data=self.dev_data,
            epochs=epochs,
            callbacks=self._make_callbacks(log_dir),
            initial_epoch=initial_epoch,
        )

        if model_dir is not None:
            parser.save(model_dir)
            with open(os.path.join(model_dir, 'trainer.info'), 'w') as f:
                print(f'dataset: {self.dataset}', file=f)
                print(f'batch_size: {self.batch_size}', file=f)
                print(f'epochs: {epochs}', file=f)
                print(f'lr: {lr}', file=f)

        return parser